diff --git "a/wandb/run-20220302_041332-j5suzd56/files/wandb-summary.json" "b/wandb/run-20220302_041332-j5suzd56/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220302_041332-j5suzd56/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.5069, "train/learning_rate": 5.92e-05, "train/epoch": 1.0, "train/global_step": 297, "_runtime": 4742, "_timestamp": 1646199154, "_step": 297, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 117.0, 651.0, 234.0, 12.0], "bins": [-389.90692138671875, -383.5785827636719, -377.250244140625, -370.92193603515625, -364.5935974121094, -358.2652587890625, -351.93695068359375, -345.6086120605469, -339.2802734375, -332.9519348144531, -326.62359619140625, -320.2952880859375, -313.9669494628906, -307.63861083984375, -301.310302734375, -294.9819641113281, -288.65362548828125, -282.3252868652344, -275.9969482421875, -269.66864013671875, -263.3403015136719, -257.011962890625, -250.6836395263672, -244.35531616210938, -238.0269775390625, -231.69863891601562, -225.3703155517578, -219.0419921875, -212.71365356445312, -206.38531494140625, -200.05699157714844, -193.72866821289062, -187.4003448486328, -181.072021484375, -174.74368286132812, -168.41534423828125, -162.08702087402344, -155.75869750976562, -149.43035888671875, -143.10202026367188, -136.77369689941406, -130.44537353515625, -124.11703491210938, -117.78870391845703, -111.46037292480469, -105.13204193115234, -98.8037109375, -92.47537994384766, -86.14704132080078, -79.81871032714844, -73.4903793334961, -67.16204833984375, -60.833717346191406, -54.50538635253906, -48.17705535888672, -41.848724365234375, -35.5203971862793, -29.192066192626953, -22.86373519897461, -16.535404205322266, -10.207073211669922, -3.878742218017578, 2.4495887756347656, 8.77791976928711, 15.10625171661377]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 13.0, 8.0, 17.0, 21.0, 14.0, 26.0, 32.0, 17.0, 43.0, 55.0, 40.0, 43.0, 49.0, 46.0, 60.0, 54.0, 56.0, 54.0, 39.0, 34.0, 43.0, 28.0, 33.0, 20.0, 27.0, 17.0, 27.0, 9.0, 9.0, 14.0, 12.0, 4.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-62.19386291503906, -60.59320068359375, -58.99253845214844, -57.391876220703125, -55.79121398925781, -54.1905517578125, -52.58988571166992, -50.98922348022461, -49.3885612487793, -47.787899017333984, -46.18723678588867, -44.58657455444336, -42.98590850830078, -41.38524627685547, -39.784584045410156, -38.183921813964844, -36.58325958251953, -34.98259735107422, -33.381935119628906, -31.78127098083496, -30.18060874938965, -28.579946517944336, -26.97928237915039, -25.378620147705078, -23.777957916259766, -22.177295684814453, -20.57663345336914, -18.975969314575195, -17.375307083129883, -15.77464485168457, -14.173981666564941, -12.573318481445312, -10.972652435302734, -9.371990203857422, -7.771327018737793, -6.170664310455322, -4.570001602172852, -2.969339370727539, -1.3686761856079102, 0.23198699951171875, 1.8326492309570312, 3.433311939239502, 5.033974647521973, 6.634637355804443, 8.235300064086914, 9.835962295532227, 11.436625480651855, 13.037288665771484, 14.637950897216797, 16.23861312866211, 17.839275360107422, 19.439939498901367, 21.04060173034668, 22.641263961791992, 24.241928100585938, 25.84259033203125, 27.443252563476562, 29.043914794921875, 30.644577026367188, 32.2452392578125, 33.84590148925781, 35.446563720703125, 37.0472297668457, 38.647891998291016, 40.24855422973633]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 5.0, 10.0, 9.0, 10.0, 15.0, 19.0, 15.0, 15.0, 29.0, 28.0, 36.0, 52.0, 40.0, 49.0, 40.0, 49.0, 48.0, 70.0, 56.0, 36.0, 48.0, 37.0, 31.0, 37.0, 32.0, 34.0, 21.0, 22.0, 21.0, 23.0, 10.0, 15.0, 12.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.24615478515625, -2.1641845703125, -2.08221435546875, -2.000244140625, -1.91827392578125, -1.8363037109375, -1.75433349609375, -1.67236328125, -1.59039306640625, -1.5084228515625, -1.42645263671875, -1.344482421875, -1.26251220703125, -1.1805419921875, -1.09857177734375, -1.0166015625, -0.93463134765625, -0.8526611328125, -0.77069091796875, -0.688720703125, -0.60675048828125, -0.5247802734375, -0.44281005859375, -0.36083984375, -0.27886962890625, -0.1968994140625, -0.11492919921875, -0.032958984375, 0.04901123046875, 0.1309814453125, 0.21295166015625, 0.294921875, 0.37689208984375, 0.4588623046875, 0.54083251953125, 0.622802734375, 0.70477294921875, 0.7867431640625, 0.86871337890625, 0.95068359375, 1.03265380859375, 1.1146240234375, 1.19659423828125, 1.278564453125, 1.36053466796875, 1.4425048828125, 1.52447509765625, 1.6064453125, 1.68841552734375, 1.7703857421875, 1.85235595703125, 1.934326171875, 2.01629638671875, 2.0982666015625, 2.18023681640625, 2.26220703125, 2.34417724609375, 2.4261474609375, 2.50811767578125, 2.590087890625, 2.67205810546875, 2.7540283203125, 2.83599853515625, 2.91796875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 5.0, 9.0, 5.0, 15.0, 22.0, 37.0, 64.0, 90.0, 162.0, 276.0, 457.0, 891.0, 1726.0, 4247.0, 14065.0, 78326.0, 901183.0, 2831164.0, 309275.0, 37287.0, 8841.0, 3094.0, 1379.0, 698.0, 425.0, 240.0, 120.0, 61.0, 51.0, 23.0, 13.0, 17.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.84619140625, -10.5205078125, -10.19482421875, -9.869140625, -9.54345703125, -9.2177734375, -8.89208984375, -8.56640625, -8.24072265625, -7.9150390625, -7.58935546875, -7.263671875, -6.93798828125, -6.6123046875, -6.28662109375, -5.9609375, -5.63525390625, -5.3095703125, -4.98388671875, -4.658203125, -4.33251953125, -4.0068359375, -3.68115234375, -3.35546875, -3.02978515625, -2.7041015625, -2.37841796875, -2.052734375, -1.72705078125, -1.4013671875, -1.07568359375, -0.75, -0.42431640625, -0.0986328125, 0.22705078125, 0.552734375, 0.87841796875, 1.2041015625, 1.52978515625, 1.85546875, 2.18115234375, 2.5068359375, 2.83251953125, 3.158203125, 3.48388671875, 3.8095703125, 4.13525390625, 4.4609375, 4.78662109375, 5.1123046875, 5.43798828125, 5.763671875, 6.08935546875, 6.4150390625, 6.74072265625, 7.06640625, 7.39208984375, 7.7177734375, 8.04345703125, 8.369140625, 8.69482421875, 9.0205078125, 9.34619140625, 9.671875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 10.0, 6.0, 15.0, 22.0, 26.0, 41.0, 59.0, 84.0, 125.0, 149.0, 261.0, 360.0, 456.0, 540.0, 512.0, 435.0, 292.0, 202.0, 143.0, 122.0, 65.0, 45.0, 35.0, 21.0, 11.0, 12.0, 3.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.609375, -12.2742919921875, -11.939208984375, -11.6041259765625, -11.26904296875, -10.9339599609375, -10.598876953125, -10.2637939453125, -9.9287109375, -9.5936279296875, -9.258544921875, -8.9234619140625, -8.58837890625, -8.2532958984375, -7.918212890625, -7.5831298828125, -7.248046875, -6.9129638671875, -6.577880859375, -6.2427978515625, -5.90771484375, -5.5726318359375, -5.237548828125, -4.9024658203125, -4.5673828125, -4.2322998046875, -3.897216796875, -3.5621337890625, -3.22705078125, -2.8919677734375, -2.556884765625, -2.2218017578125, -1.88671875, -1.5516357421875, -1.216552734375, -0.8814697265625, -0.54638671875, -0.2113037109375, 0.123779296875, 0.4588623046875, 0.7939453125, 1.1290283203125, 1.464111328125, 1.7991943359375, 2.13427734375, 2.4693603515625, 2.804443359375, 3.1395263671875, 3.474609375, 3.8096923828125, 4.144775390625, 4.4798583984375, 4.81494140625, 5.1500244140625, 5.485107421875, 5.8201904296875, 6.1552734375, 6.4903564453125, 6.825439453125, 7.1605224609375, 7.49560546875, 7.8306884765625, 8.165771484375, 8.5008544921875, 8.8359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 6.0, 13.0, 10.0, 14.0, 21.0, 49.0, 67.0, 100.0, 159.0, 269.0, 450.0, 858.0, 1879.0, 6225.0, 174344.0, 3887694.0, 112843.0, 5511.0, 1755.0, 846.0, 470.0, 240.0, 154.0, 107.0, 50.0, 35.0, 35.0, 17.0, 12.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.65625, -35.52685546875, -34.3974609375, -33.26806640625, -32.138671875, -31.00927734375, -29.8798828125, -28.75048828125, -27.62109375, -26.49169921875, -25.3623046875, -24.23291015625, -23.103515625, -21.97412109375, -20.8447265625, -19.71533203125, -18.5859375, -17.45654296875, -16.3271484375, -15.19775390625, -14.068359375, -12.93896484375, -11.8095703125, -10.68017578125, -9.55078125, -8.42138671875, -7.2919921875, -6.16259765625, -5.033203125, -3.90380859375, -2.7744140625, -1.64501953125, -0.515625, 0.61376953125, 1.7431640625, 2.87255859375, 4.001953125, 5.13134765625, 6.2607421875, 7.39013671875, 8.51953125, 9.64892578125, 10.7783203125, 11.90771484375, 13.037109375, 14.16650390625, 15.2958984375, 16.42529296875, 17.5546875, 18.68408203125, 19.8134765625, 20.94287109375, 22.072265625, 23.20166015625, 24.3310546875, 25.46044921875, 26.58984375, 27.71923828125, 28.8486328125, 29.97802734375, 31.107421875, 32.23681640625, 33.3662109375, 34.49560546875, 35.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 21.0, 81.0, 209.0, 340.0, 227.0, 107.0, 21.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.21906280517578, -78.64128112792969, -76.06349182128906, -73.48571014404297, -70.90792846679688, -68.33013916015625, -65.75235748291016, -63.17457580566406, -60.5967903137207, -58.019004821777344, -55.44122314453125, -52.86343765258789, -50.28565216064453, -47.70787048339844, -45.13008499145508, -42.55229949951172, -39.974517822265625, -37.396732330322266, -34.81895065307617, -32.24116516113281, -29.663381576538086, -27.08559799194336, -24.5078125, -21.930028915405273, -19.352245330810547, -16.77446174621582, -14.196677207946777, -11.618892669677734, -9.041109085083008, -6.463325500488281, -3.8855409622192383, -1.3077564239501953, 1.2700347900390625, 3.8478188514709473, 6.425602912902832, 9.003387451171875, 11.581171035766602, 14.158954620361328, 16.736740112304688, 19.314523696899414, 21.89230728149414, 24.470090866088867, 27.047874450683594, 29.625659942626953, 32.20344543457031, 34.781227111816406, 37.359012603759766, 39.936798095703125, 42.51457977294922, 45.09236526489258, 47.67014694213867, 50.24793243408203, 52.825714111328125, 55.403499603271484, 57.981285095214844, 60.55906677246094, 63.1368522644043, 65.71463775634766, 68.29241943359375, 70.87020111083984, 73.44799041748047, 76.02577209472656, 78.60355377197266, 81.18134307861328, 83.75912475585938]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 7.0, 8.0, 12.0, 14.0, 23.0, 19.0, 25.0, 25.0, 25.0, 32.0, 38.0, 33.0, 42.0, 40.0, 33.0, 42.0, 43.0, 46.0, 43.0, 58.0, 49.0, 42.0, 40.0, 35.0, 40.0, 29.0, 29.0, 24.0, 17.0, 18.0, 16.0, 6.0, 7.0, 13.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.706695556640625, -31.624561309814453, -30.54242515563965, -29.460290908813477, -28.378154754638672, -27.2960205078125, -26.213886260986328, -25.131752014160156, -24.04961585998535, -22.96748161315918, -21.885345458984375, -20.803211212158203, -19.72107696533203, -18.638940811157227, -17.556806564331055, -16.47467041015625, -15.392536163330078, -14.31040096282959, -13.228265762329102, -12.14613151550293, -11.063996315002441, -9.981861114501953, -8.899726867675781, -7.817591667175293, -6.735456466674805, -5.653321266174316, -4.571186542510986, -3.489051580429077, -2.406916618347168, -1.3247814178466797, -0.2426466941833496, 0.8394880294799805, 1.9216194152832031, 3.0037543773651123, 4.0858893394470215, 5.168024063110352, 6.25015926361084, 7.332294464111328, 8.4144287109375, 9.496563911437988, 10.578699111938477, 11.660834312438965, 12.742969512939453, 13.825103759765625, 14.907238960266113, 15.989374160766602, 17.071508407592773, 18.153644561767578, 19.23577880859375, 20.317913055419922, 21.400049209594727, 22.4821834564209, 23.564319610595703, 24.646453857421875, 25.728588104248047, 26.81072235107422, 27.892858505249023, 28.974992752075195, 30.05712890625, 31.139263153076172, 32.221397399902344, 33.30353546142578, 34.38566970825195, 35.467803955078125, 36.5499382019043]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 7.0, 9.0, 13.0, 13.0, 15.0, 27.0, 22.0, 14.0, 29.0, 28.0, 34.0, 31.0, 36.0, 47.0, 52.0, 38.0, 50.0, 49.0, 50.0, 36.0, 37.0, 41.0, 44.0, 36.0, 35.0, 31.0, 22.0, 23.0, 24.0, 14.0, 19.0, 13.0, 15.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.296905517578125, -2.21685791015625, -2.136810302734375, -2.0567626953125, -1.976715087890625, -1.89666748046875, -1.816619873046875, -1.736572265625, -1.656524658203125, -1.57647705078125, -1.496429443359375, -1.4163818359375, -1.336334228515625, -1.25628662109375, -1.176239013671875, -1.09619140625, -1.016143798828125, -0.93609619140625, -0.856048583984375, -0.7760009765625, -0.695953369140625, -0.61590576171875, -0.535858154296875, -0.455810546875, -0.375762939453125, -0.29571533203125, -0.215667724609375, -0.1356201171875, -0.055572509765625, 0.02447509765625, 0.104522705078125, 0.1845703125, 0.264617919921875, 0.34466552734375, 0.424713134765625, 0.5047607421875, 0.584808349609375, 0.66485595703125, 0.744903564453125, 0.824951171875, 0.904998779296875, 0.98504638671875, 1.065093994140625, 1.1451416015625, 1.225189208984375, 1.30523681640625, 1.385284423828125, 1.46533203125, 1.545379638671875, 1.62542724609375, 1.705474853515625, 1.7855224609375, 1.865570068359375, 1.94561767578125, 2.025665283203125, 2.105712890625, 2.185760498046875, 2.26580810546875, 2.345855712890625, 2.4259033203125, 2.505950927734375, 2.58599853515625, 2.666046142578125, 2.74609375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 7.0, 13.0, 19.0, 33.0, 37.0, 51.0, 82.0, 113.0, 177.0, 260.0, 377.0, 572.0, 924.0, 1476.0, 2330.0, 3580.0, 5862.0, 9807.0, 16274.0, 27015.0, 45356.0, 74976.0, 122388.0, 190473.0, 202971.0, 134488.0, 82778.0, 50038.0, 30008.0, 17856.0, 10728.0, 6481.0, 4057.0, 2418.0, 1547.0, 995.0, 715.0, 422.0, 249.0, 191.0, 128.0, 80.0, 59.0, 32.0, 37.0, 18.0, 17.0, 14.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.2022705078125, -0.1959686279296875, -0.189666748046875, -0.1833648681640625, -0.17706298828125, -0.1707611083984375, -0.164459228515625, -0.1581573486328125, -0.15185546875, -0.1455535888671875, -0.139251708984375, -0.1329498291015625, -0.12664794921875, -0.1203460693359375, -0.114044189453125, -0.1077423095703125, -0.1014404296875, -0.0951385498046875, -0.088836669921875, -0.0825347900390625, -0.07623291015625, -0.0699310302734375, -0.063629150390625, -0.0573272705078125, -0.051025390625, -0.0447235107421875, -0.038421630859375, -0.0321197509765625, -0.02581787109375, -0.0195159912109375, -0.013214111328125, -0.0069122314453125, -0.0006103515625, 0.0056915283203125, 0.011993408203125, 0.0182952880859375, 0.02459716796875, 0.0308990478515625, 0.037200927734375, 0.0435028076171875, 0.0498046875, 0.0561065673828125, 0.062408447265625, 0.0687103271484375, 0.07501220703125, 0.0813140869140625, 0.087615966796875, 0.0939178466796875, 0.1002197265625, 0.1065216064453125, 0.112823486328125, 0.1191253662109375, 0.12542724609375, 0.1317291259765625, 0.138031005859375, 0.1443328857421875, 0.150634765625, 0.1569366455078125, 0.163238525390625, 0.1695404052734375, 0.17584228515625, 0.1821441650390625, 0.188446044921875, 0.1947479248046875, 0.2010498046875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 10.0, 6.0, 7.0, 7.0, 14.0, 15.0, 24.0, 18.0, 29.0, 32.0, 32.0, 37.0, 36.0, 34.0, 48.0, 38.0, 49.0, 54.0, 1059.0, 52.0, 46.0, 38.0, 41.0, 42.0, 29.0, 26.0, 29.0, 17.0, 22.0, 30.0, 20.0, 18.0, 14.0, 12.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3083343505859375, -1.258270263671875, -1.2082061767578125, -1.15814208984375, -1.1080780029296875, -1.058013916015625, -1.0079498291015625, -0.9578857421875, -0.9078216552734375, -0.857757568359375, -0.8076934814453125, -0.75762939453125, -0.7075653076171875, -0.657501220703125, -0.6074371337890625, -0.557373046875, -0.5073089599609375, -0.457244873046875, -0.4071807861328125, -0.35711669921875, -0.3070526123046875, -0.256988525390625, -0.2069244384765625, -0.1568603515625, -0.1067962646484375, -0.056732177734375, -0.0066680908203125, 0.04339599609375, 0.0934600830078125, 0.143524169921875, 0.1935882568359375, 0.24365234375, 0.2937164306640625, 0.343780517578125, 0.3938446044921875, 0.44390869140625, 0.4939727783203125, 0.544036865234375, 0.5941009521484375, 0.6441650390625, 0.6942291259765625, 0.744293212890625, 0.7943572998046875, 0.84442138671875, 0.8944854736328125, 0.944549560546875, 0.9946136474609375, 1.044677734375, 1.0947418212890625, 1.144805908203125, 1.1948699951171875, 1.24493408203125, 1.2949981689453125, 1.345062255859375, 1.3951263427734375, 1.4451904296875, 1.4952545166015625, 1.545318603515625, 1.5953826904296875, 1.64544677734375, 1.6955108642578125, 1.745574951171875, 1.7956390380859375, 1.845703125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 5.0, 18.0, 18.0, 18.0, 40.0, 58.0, 89.0, 115.0, 195.0, 270.0, 404.0, 592.0, 859.0, 1228.0, 1790.0, 2628.0, 3764.0, 5535.0, 7963.0, 11863.0, 17369.0, 25599.0, 37847.0, 55897.0, 82904.0, 118622.0, 1117951.0, 238714.0, 115932.0, 80122.0, 53969.0, 36531.0, 24699.0, 16596.0, 11580.0, 7968.0, 5506.0, 3708.0, 2545.0, 1790.0, 1247.0, 830.0, 571.0, 381.0, 235.0, 174.0, 130.0, 97.0, 48.0, 47.0, 22.0, 20.0, 18.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1290283203125, -0.12486076354980469, -0.12069320678710938, -0.11652565002441406, -0.11235809326171875, -0.10819053649902344, -0.10402297973632812, -0.09985542297363281, -0.0956878662109375, -0.09152030944824219, -0.08735275268554688, -0.08318519592285156, -0.07901763916015625, -0.07485008239746094, -0.07068252563476562, -0.06651496887207031, -0.062347412109375, -0.05817985534667969, -0.054012298583984375, -0.04984474182128906, -0.04567718505859375, -0.04150962829589844, -0.037342071533203125, -0.03317451477050781, -0.0290069580078125, -0.024839401245117188, -0.020671844482421875, -0.016504287719726562, -0.01233673095703125, -0.008169174194335938, -0.004001617431640625, 0.0001659393310546875, 0.00433349609375, 0.008501052856445312, 0.012668609619140625, 0.016836166381835938, 0.02100372314453125, 0.025171279907226562, 0.029338836669921875, 0.03350639343261719, 0.0376739501953125, 0.04184150695800781, 0.046009063720703125, 0.05017662048339844, 0.05434417724609375, 0.05851173400878906, 0.06267929077148438, 0.06684684753417969, 0.071014404296875, 0.07518196105957031, 0.07934951782226562, 0.08351707458496094, 0.08768463134765625, 0.09185218811035156, 0.09601974487304688, 0.10018730163574219, 0.1043548583984375, 0.10852241516113281, 0.11268997192382812, 0.11685752868652344, 0.12102508544921875, 0.12519264221191406, 0.12936019897460938, 0.1335277557373047, 0.1376953125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 6.0, 16.0, 3.0, 6.0, 14.0, 14.0, 21.0, 25.0, 36.0, 34.0, 47.0, 35.0, 55.0, 52.0, 50.0, 38.0, 48.0, 43.0, 56.0, 55.0, 36.0, 45.0, 45.0, 28.0, 27.0, 23.0, 12.0, 22.0, 18.0, 10.0, 11.0, 13.0, 6.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005435943603515625, -0.0005276650190353394, -0.0005117356777191162, -0.0004958063364028931, -0.0004798769950866699, -0.0004639476537704468, -0.00044801831245422363, -0.0004320889711380005, -0.00041615962982177734, -0.0004002302885055542, -0.00038430094718933105, -0.0003683716058731079, -0.00035244226455688477, -0.0003365129232406616, -0.0003205835819244385, -0.00030465424060821533, -0.0002887248992919922, -0.00027279555797576904, -0.0002568662166595459, -0.00024093687534332275, -0.0002250075340270996, -0.00020907819271087646, -0.00019314885139465332, -0.00017721951007843018, -0.00016129016876220703, -0.0001453608274459839, -0.00012943148612976074, -0.0001135021448135376, -9.757280349731445e-05, -8.164346218109131e-05, -6.571412086486816e-05, -4.978477954864502e-05, -3.3855438232421875e-05, -1.792609691619873e-05, -1.996755599975586e-06, 1.3932585716247559e-05, 2.9861927032470703e-05, 4.579126834869385e-05, 6.172060966491699e-05, 7.764995098114014e-05, 9.357929229736328e-05, 0.00010950863361358643, 0.00012543797492980957, 0.00014136731624603271, 0.00015729665756225586, 0.000173225998878479, 0.00018915534019470215, 0.0002050846815109253, 0.00022101402282714844, 0.00023694336414337158, 0.0002528727054595947, 0.00026880204677581787, 0.000284731388092041, 0.00030066072940826416, 0.0003165900707244873, 0.00033251941204071045, 0.0003484487533569336, 0.00036437809467315674, 0.0003803074359893799, 0.00039623677730560303, 0.00041216611862182617, 0.0004280954599380493, 0.00044402480125427246, 0.0004599541425704956, 0.00047588348388671875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 6.0, 0.0, 7.0, 6.0, 7.0, 8.0, 12.0, 13.0, 24.0, 21.0, 22.0, 31.0, 37.0, 31.0, 46.0, 62.0, 72.0, 94.0, 118.0, 165.0, 196.0, 230.0, 385.0, 821.0, 23234.0, 1018160.0, 2672.0, 617.0, 326.0, 217.0, 186.0, 137.0, 112.0, 87.0, 58.0, 56.0, 50.0, 52.0, 36.0, 28.0, 26.0, 20.0, 17.0, 16.0, 10.0, 10.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.00925445556640625, -0.008968234062194824, -0.008682012557983398, -0.008395791053771973, -0.008109569549560547, -0.007823348045349121, -0.007537126541137695, -0.0072509050369262695, -0.006964683532714844, -0.006678462028503418, -0.006392240524291992, -0.006106019020080566, -0.005819797515869141, -0.005533576011657715, -0.005247354507446289, -0.004961133003234863, -0.0046749114990234375, -0.004388689994812012, -0.004102468490600586, -0.00381624698638916, -0.0035300254821777344, -0.0032438039779663086, -0.002957582473754883, -0.002671360969543457, -0.0023851394653320312, -0.0020989179611206055, -0.0018126964569091797, -0.001526474952697754, -0.0012402534484863281, -0.0009540319442749023, -0.0006678104400634766, -0.0003815889358520508, -9.5367431640625e-05, 0.00019085407257080078, 0.00047707557678222656, 0.0007632970809936523, 0.0010495185852050781, 0.001335740089416504, 0.0016219615936279297, 0.0019081830978393555, 0.0021944046020507812, 0.002480626106262207, 0.002766847610473633, 0.0030530691146850586, 0.0033392906188964844, 0.00362551212310791, 0.003911733627319336, 0.004197955131530762, 0.0044841766357421875, 0.004770398139953613, 0.005056619644165039, 0.005342841148376465, 0.005629062652587891, 0.005915284156799316, 0.006201505661010742, 0.006487727165222168, 0.006773948669433594, 0.0070601701736450195, 0.007346391677856445, 0.007632613182067871, 0.007918834686279297, 0.008205056190490723, 0.008491277694702148, 0.008777499198913574, 0.009063720703125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 34.0, 844.0, 135.0, 1.0], "bins": [-0.0048851193860173225, -0.004805841017514467, -0.004726562183350325, -0.004647283814847469, -0.004568005446344614, -0.004488727077841759, -0.004409448243677616, -0.004330169875174761, -0.0042508915066719055, -0.00417161313816905, -0.004092334304004908, -0.004013055935502052, -0.003933777566999197, -0.003854498965665698, -0.0037752205971628428, -0.003695941995829344, -0.003616663394495845, -0.003537384793162346, -0.0034581064246594906, -0.0033788278233259916, -0.0032995494548231363, -0.0032202708534896374, -0.003140992484986782, -0.003061713883653283, -0.002982435282319784, -0.002903156680986285, -0.00282387831248343, -0.002744599711149931, -0.0026653213426470757, -0.0025860427413135767, -0.0025067643728107214, -0.0024274857714772224, -0.0023482071701437235, -0.0022689285688102245, -0.0021896502003073692, -0.0021103715989738703, -0.002031093230471015, -0.001951814629137516, -0.001872536144219339, -0.0017932576593011618, -0.0017139792907983065, -0.0016347008058801293, -0.0015554223209619522, -0.001476143836043775, -0.001396865351125598, -0.001317586749792099, -0.0012383082648739219, -0.0011590297799557447, -0.0010797512950375676, -0.0010004728101193905, -0.0009211943252012134, -0.0008419157820753753, -0.0007626372971571982, -0.0006833588122390211, -0.000604080269113183, -0.0005248017841950059, -0.00044552329927682877, -0.00036624481435865164, -0.00028696630033664405, -0.0002076878008665517, -0.00012840930139645934, -4.913081647828221e-05, 3.014769754372537e-05, 0.00010942621156573296, 0.0001887047110358253]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 7.0, 3.0, 7.0, 16.0, 9.0, 16.0, 11.0, 11.0, 10.0, 18.0, 22.0, 30.0, 32.0, 43.0, 23.0, 35.0, 34.0, 43.0, 40.0, 41.0, 32.0, 36.0, 37.0, 28.0, 36.0, 29.0, 36.0, 40.0, 29.0, 29.0, 17.0, 20.0, 18.0, 32.0, 13.0, 25.0, 14.0, 9.0, 12.0, 5.0, 9.0, 8.0, 5.0, 9.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027430057525634766, -0.0002656802535057068, -0.0002570599317550659, -0.00024843961000442505, -0.00023981928825378418, -0.0002311989665031433, -0.00022257864475250244, -0.00021395832300186157, -0.0002053380012512207, -0.00019671767950057983, -0.00018809735774993896, -0.0001794770359992981, -0.00017085671424865723, -0.00016223639249801636, -0.0001536160707473755, -0.00014499574899673462, -0.00013637542724609375, -0.00012775510549545288, -0.00011913478374481201, -0.00011051446199417114, -0.00010189414024353027, -9.32738184928894e-05, -8.465349674224854e-05, -7.603317499160767e-05, -6.74128532409668e-05, -5.879253149032593e-05, -5.017220973968506e-05, -4.155188798904419e-05, -3.293156623840332e-05, -2.431124448776245e-05, -1.5690922737121582e-05, -7.070600986480713e-06, 1.5497207641601562e-06, 1.0170042514801025e-05, 1.8790364265441895e-05, 2.7410686016082764e-05, 3.603100776672363e-05, 4.46513295173645e-05, 5.327165126800537e-05, 6.189197301864624e-05, 7.051229476928711e-05, 7.913261651992798e-05, 8.775293827056885e-05, 9.637326002120972e-05, 0.00010499358177185059, 0.00011361390352249146, 0.00012223422527313232, 0.0001308545470237732, 0.00013947486877441406, 0.00014809519052505493, 0.0001567155122756958, 0.00016533583402633667, 0.00017395615577697754, 0.0001825764775276184, 0.00019119679927825928, 0.00019981712102890015, 0.00020843744277954102, 0.00021705776453018188, 0.00022567808628082275, 0.00023429840803146362, 0.0002429187297821045, 0.00025153905153274536, 0.00026015937328338623, 0.0002687796950340271, 0.00027740001678466797]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 7.0, 9.0, 13.0, 13.0, 15.0, 27.0, 22.0, 14.0, 29.0, 28.0, 34.0, 31.0, 36.0, 47.0, 52.0, 38.0, 50.0, 49.0, 50.0, 36.0, 37.0, 41.0, 44.0, 36.0, 35.0, 31.0, 22.0, 23.0, 24.0, 14.0, 19.0, 13.0, 15.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.296905517578125, -2.21685791015625, -2.136810302734375, -2.0567626953125, -1.976715087890625, -1.89666748046875, -1.816619873046875, -1.736572265625, -1.656524658203125, -1.57647705078125, -1.496429443359375, -1.4163818359375, -1.336334228515625, -1.25628662109375, -1.176239013671875, -1.09619140625, -1.016143798828125, -0.93609619140625, -0.856048583984375, -0.7760009765625, -0.695953369140625, -0.61590576171875, -0.535858154296875, -0.455810546875, -0.375762939453125, -0.29571533203125, -0.215667724609375, -0.1356201171875, -0.055572509765625, 0.02447509765625, 0.104522705078125, 0.1845703125, 0.264617919921875, 0.34466552734375, 0.424713134765625, 0.5047607421875, 0.584808349609375, 0.66485595703125, 0.744903564453125, 0.824951171875, 0.904998779296875, 0.98504638671875, 1.065093994140625, 1.1451416015625, 1.225189208984375, 1.30523681640625, 1.385284423828125, 1.46533203125, 1.545379638671875, 1.62542724609375, 1.705474853515625, 1.7855224609375, 1.865570068359375, 1.94561767578125, 2.025665283203125, 2.105712890625, 2.185760498046875, 2.26580810546875, 2.345855712890625, 2.4259033203125, 2.505950927734375, 2.58599853515625, 2.666046142578125, 2.74609375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 5.0, 9.0, 14.0, 30.0, 34.0, 44.0, 58.0, 82.0, 122.0, 151.0, 212.0, 290.0, 391.0, 591.0, 731.0, 1107.0, 1483.0, 2214.0, 3087.0, 4795.0, 7646.0, 13639.0, 29917.0, 92708.0, 331696.0, 374486.0, 109682.0, 34039.0, 15059.0, 8122.0, 4997.0, 3308.0, 2169.0, 1558.0, 1115.0, 827.0, 599.0, 420.0, 320.0, 245.0, 155.0, 112.0, 82.0, 63.0, 50.0, 28.0, 22.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.78515625, -6.57354736328125, -6.3619384765625, -6.15032958984375, -5.938720703125, -5.72711181640625, -5.5155029296875, -5.30389404296875, -5.09228515625, -4.88067626953125, -4.6690673828125, -4.45745849609375, -4.245849609375, -4.03424072265625, -3.8226318359375, -3.61102294921875, -3.3994140625, -3.18780517578125, -2.9761962890625, -2.76458740234375, -2.552978515625, -2.34136962890625, -2.1297607421875, -1.91815185546875, -1.70654296875, -1.49493408203125, -1.2833251953125, -1.07171630859375, -0.860107421875, -0.64849853515625, -0.4368896484375, -0.22528076171875, -0.013671875, 0.19793701171875, 0.4095458984375, 0.62115478515625, 0.832763671875, 1.04437255859375, 1.2559814453125, 1.46759033203125, 1.67919921875, 1.89080810546875, 2.1024169921875, 2.31402587890625, 2.525634765625, 2.73724365234375, 2.9488525390625, 3.16046142578125, 3.3720703125, 3.58367919921875, 3.7952880859375, 4.00689697265625, 4.218505859375, 4.43011474609375, 4.6417236328125, 4.85333251953125, 5.06494140625, 5.27655029296875, 5.4881591796875, 5.69976806640625, 5.911376953125, 6.12298583984375, 6.3345947265625, 6.54620361328125, 6.7578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 6.0, 13.0, 10.0, 10.0, 4.0, 24.0, 18.0, 15.0, 24.0, 19.0, 30.0, 26.0, 31.0, 33.0, 53.0, 54.0, 84.0, 150.0, 223.0, 1314.0, 244.0, 143.0, 97.0, 51.0, 51.0, 40.0, 30.0, 37.0, 32.0, 23.0, 19.0, 19.0, 23.0, 18.0, 13.0, 15.0, 8.0, 7.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.49609375, -7.27294921875, -7.0498046875, -6.82666015625, -6.603515625, -6.38037109375, -6.1572265625, -5.93408203125, -5.7109375, -5.48779296875, -5.2646484375, -5.04150390625, -4.818359375, -4.59521484375, -4.3720703125, -4.14892578125, -3.92578125, -3.70263671875, -3.4794921875, -3.25634765625, -3.033203125, -2.81005859375, -2.5869140625, -2.36376953125, -2.140625, -1.91748046875, -1.6943359375, -1.47119140625, -1.248046875, -1.02490234375, -0.8017578125, -0.57861328125, -0.35546875, -0.13232421875, 0.0908203125, 0.31396484375, 0.537109375, 0.76025390625, 0.9833984375, 1.20654296875, 1.4296875, 1.65283203125, 1.8759765625, 2.09912109375, 2.322265625, 2.54541015625, 2.7685546875, 2.99169921875, 3.21484375, 3.43798828125, 3.6611328125, 3.88427734375, 4.107421875, 4.33056640625, 4.5537109375, 4.77685546875, 5.0, 5.22314453125, 5.4462890625, 5.66943359375, 5.892578125, 6.11572265625, 6.3388671875, 6.56201171875, 6.78515625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 10.0, 10.0, 14.0, 14.0, 12.0, 23.0, 22.0, 30.0, 34.0, 34.0, 47.0, 71.0, 112.0, 218.0, 613.0, 2778.0, 358014.0, 2774986.0, 6927.0, 889.0, 288.0, 142.0, 100.0, 57.0, 37.0, 26.0, 30.0, 18.0, 24.0, 18.0, 17.0, 11.0, 7.0, 9.0, 15.0, 4.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.25, -25.349853515625, -24.44970703125, -23.549560546875, -22.6494140625, -21.749267578125, -20.84912109375, -19.948974609375, -19.048828125, -18.148681640625, -17.24853515625, -16.348388671875, -15.4482421875, -14.548095703125, -13.64794921875, -12.747802734375, -11.84765625, -10.947509765625, -10.04736328125, -9.147216796875, -8.2470703125, -7.346923828125, -6.44677734375, -5.546630859375, -4.646484375, -3.746337890625, -2.84619140625, -1.946044921875, -1.0458984375, -0.145751953125, 0.75439453125, 1.654541015625, 2.5546875, 3.454833984375, 4.35498046875, 5.255126953125, 6.1552734375, 7.055419921875, 7.95556640625, 8.855712890625, 9.755859375, 10.656005859375, 11.55615234375, 12.456298828125, 13.3564453125, 14.256591796875, 15.15673828125, 16.056884765625, 16.95703125, 17.857177734375, 18.75732421875, 19.657470703125, 20.5576171875, 21.457763671875, 22.35791015625, 23.258056640625, 24.158203125, 25.058349609375, 25.95849609375, 26.858642578125, 27.7587890625, 28.658935546875, 29.55908203125, 30.459228515625, 31.359375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 887.0, 118.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.46012878417969, -73.2244873046875, -66.98884582519531, -60.75320816040039, -54.5175666809082, -48.281925201416016, -42.046287536621094, -35.810646057128906, -29.57500457763672, -23.33936309814453, -17.103723526000977, -10.868083953857422, -4.632442474365234, 1.6031990051269531, 7.838836669921875, 14.074478149414062, 20.31011962890625, 26.545761108398438, 32.781402587890625, 39.01704025268555, 45.252681732177734, 51.48832321166992, 57.723960876464844, 63.95960235595703, 70.19524383544922, 76.4308853149414, 82.6665267944336, 88.90216064453125, 95.13780212402344, 101.37344360351562, 107.60908508300781, 113.8447265625, 120.08038330078125, 126.31602478027344, 132.55166625976562, 138.7873077392578, 145.02294921875, 151.2585906982422, 157.49423217773438, 163.7298583984375, 169.96551513671875, 176.20115661621094, 182.43679809570312, 188.6724395751953, 194.9080810546875, 201.1437225341797, 207.37936401367188, 213.614990234375, 219.8506317138672, 226.08627319335938, 232.32191467285156, 238.55755615234375, 244.79319763183594, 251.02883911132812, 257.26446533203125, 263.5001220703125, 269.7357482910156, 275.97137451171875, 282.20703125, 288.4426574707031, 294.6783142089844, 300.9139404296875, 307.14959716796875, 313.3852233886719, 319.6208801269531]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 3.0, 3.0, 10.0, 7.0, 11.0, 11.0, 16.0, 15.0, 13.0, 21.0, 22.0, 25.0, 18.0, 35.0, 31.0, 29.0, 37.0, 32.0, 40.0, 35.0, 39.0, 47.0, 36.0, 41.0, 25.0, 34.0, 49.0, 47.0, 28.0, 28.0, 19.0, 34.0, 24.0, 26.0, 14.0, 17.0, 11.0, 9.0, 13.0, 8.0, 12.0, 4.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.04438018798828, -25.22437286376953, -24.40436363220215, -23.5843563079834, -22.764347076416016, -21.944339752197266, -21.124332427978516, -20.304323196411133, -19.484315872192383, -18.664308547973633, -17.84429931640625, -17.0242919921875, -16.204282760620117, -15.384275436401367, -14.5642671585083, -13.744258880615234, -12.924250602722168, -12.104242324829102, -11.284234046936035, -10.464225769042969, -9.644218444824219, -8.824210166931152, -8.004201889038086, -7.184194087982178, -6.364185810089111, -5.544177532196045, -4.724169731140137, -3.9041614532470703, -3.084153413772583, -2.2641453742980957, -1.4441370964050293, -0.6241292953491211, 0.1958789825439453, 1.0158870220184326, 1.8358951807022095, 2.6559033393859863, 3.4759113788604736, 4.295919418334961, 5.115927696228027, 5.9359354972839355, 6.755943775177002, 7.575952053070068, 8.395959854125977, 9.215968132019043, 10.03597640991211, 10.85598373413086, 11.675992965698242, 12.496000289916992, 13.316008567810059, 14.136016845703125, 14.956025123596191, 15.776033401489258, 16.596040725708008, 17.41604995727539, 18.23605728149414, 19.05606460571289, 19.876073837280273, 20.696081161499023, 21.516090393066406, 22.336097717285156, 23.15610694885254, 23.97611427307129, 24.796123504638672, 25.616130828857422, 26.436138153076172]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 7.0, 12.0, 12.0, 15.0, 8.0, 18.0, 19.0, 21.0, 17.0, 35.0, 37.0, 34.0, 37.0, 46.0, 48.0, 44.0, 47.0, 46.0, 45.0, 37.0, 31.0, 50.0, 39.0, 35.0, 35.0, 31.0, 28.0, 27.0, 27.0, 16.0, 13.0, 19.0, 11.0, 11.0, 6.0, 6.0, 7.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.4959716796875, -2.409912109375, -2.3238525390625, -2.23779296875, -2.1517333984375, -2.065673828125, -1.9796142578125, -1.8935546875, -1.8074951171875, -1.721435546875, -1.6353759765625, -1.54931640625, -1.4632568359375, -1.377197265625, -1.2911376953125, -1.205078125, -1.1190185546875, -1.032958984375, -0.9468994140625, -0.86083984375, -0.7747802734375, -0.688720703125, -0.6026611328125, -0.5166015625, -0.4305419921875, -0.344482421875, -0.2584228515625, -0.17236328125, -0.0863037109375, -0.000244140625, 0.0858154296875, 0.171875, 0.2579345703125, 0.343994140625, 0.4300537109375, 0.51611328125, 0.6021728515625, 0.688232421875, 0.7742919921875, 0.8603515625, 0.9464111328125, 1.032470703125, 1.1185302734375, 1.20458984375, 1.2906494140625, 1.376708984375, 1.4627685546875, 1.548828125, 1.6348876953125, 1.720947265625, 1.8070068359375, 1.89306640625, 1.9791259765625, 2.065185546875, 2.1512451171875, 2.2373046875, 2.3233642578125, 2.409423828125, 2.4954833984375, 2.58154296875, 2.6676025390625, 2.753662109375, 2.8397216796875, 2.92578125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 13.0, 9.0, 12.0, 19.0, 32.0, 50.0, 53.0, 73.0, 108.0, 144.0, 190.0, 281.0, 486.0, 842.0, 1864.0, 4628.0, 15994.0, 74950.0, 590109.0, 2795175.0, 606658.0, 76989.0, 16401.0, 4995.0, 1791.0, 874.0, 461.0, 275.0, 202.0, 145.0, 133.0, 90.0, 59.0, 38.0, 28.0, 25.0, 18.0, 16.0, 14.0, 10.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4765625, -9.1553955078125, -8.834228515625, -8.5130615234375, -8.19189453125, -7.8707275390625, -7.549560546875, -7.2283935546875, -6.9072265625, -6.5860595703125, -6.264892578125, -5.9437255859375, -5.62255859375, -5.3013916015625, -4.980224609375, -4.6590576171875, -4.337890625, -4.0167236328125, -3.695556640625, -3.3743896484375, -3.05322265625, -2.7320556640625, -2.410888671875, -2.0897216796875, -1.7685546875, -1.4473876953125, -1.126220703125, -0.8050537109375, -0.48388671875, -0.1627197265625, 0.158447265625, 0.4796142578125, 0.80078125, 1.1219482421875, 1.443115234375, 1.7642822265625, 2.08544921875, 2.4066162109375, 2.727783203125, 3.0489501953125, 3.3701171875, 3.6912841796875, 4.012451171875, 4.3336181640625, 4.65478515625, 4.9759521484375, 5.297119140625, 5.6182861328125, 5.939453125, 6.2606201171875, 6.581787109375, 6.9029541015625, 7.22412109375, 7.5452880859375, 7.866455078125, 8.1876220703125, 8.5087890625, 8.8299560546875, 9.151123046875, 9.4722900390625, 9.79345703125, 10.1146240234375, 10.435791015625, 10.7569580078125, 11.078125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 7.0, 13.0, 24.0, 37.0, 30.0, 57.0, 68.0, 84.0, 111.0, 178.0, 208.0, 246.0, 279.0, 414.0, 404.0, 377.0, 350.0, 277.0, 243.0, 187.0, 123.0, 83.0, 72.0, 46.0, 47.0, 21.0, 28.0, 10.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.828125, -10.54107666015625, -10.2540283203125, -9.96697998046875, -9.679931640625, -9.39288330078125, -9.1058349609375, -8.81878662109375, -8.53173828125, -8.24468994140625, -7.9576416015625, -7.67059326171875, -7.383544921875, -7.09649658203125, -6.8094482421875, -6.52239990234375, -6.2353515625, -5.94830322265625, -5.6612548828125, -5.37420654296875, -5.087158203125, -4.80010986328125, -4.5130615234375, -4.22601318359375, -3.93896484375, -3.65191650390625, -3.3648681640625, -3.07781982421875, -2.790771484375, -2.50372314453125, -2.2166748046875, -1.92962646484375, -1.642578125, -1.35552978515625, -1.0684814453125, -0.78143310546875, -0.494384765625, -0.20733642578125, 0.0797119140625, 0.36676025390625, 0.65380859375, 0.94085693359375, 1.2279052734375, 1.51495361328125, 1.802001953125, 2.08905029296875, 2.3760986328125, 2.66314697265625, 2.9501953125, 3.23724365234375, 3.5242919921875, 3.81134033203125, 4.098388671875, 4.38543701171875, 4.6724853515625, 4.95953369140625, 5.24658203125, 5.53363037109375, 5.8206787109375, 6.10772705078125, 6.394775390625, 6.68182373046875, 6.9688720703125, 7.25592041015625, 7.54296875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 7.0, 4.0, 6.0, 9.0, 10.0, 15.0, 36.0, 40.0, 38.0, 66.0, 117.0, 187.0, 402.0, 887.0, 3103.0, 27988.0, 1003065.0, 3048841.0, 100878.0, 6116.0, 1352.0, 501.0, 230.0, 124.0, 73.0, 51.0, 47.0, 21.0, 21.0, 14.0, 8.0, 4.0, 3.0, 10.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -18.86865234375, -18.0185546875, -17.16845703125, -16.318359375, -15.46826171875, -14.6181640625, -13.76806640625, -12.91796875, -12.06787109375, -11.2177734375, -10.36767578125, -9.517578125, -8.66748046875, -7.8173828125, -6.96728515625, -6.1171875, -5.26708984375, -4.4169921875, -3.56689453125, -2.716796875, -1.86669921875, -1.0166015625, -0.16650390625, 0.68359375, 1.53369140625, 2.3837890625, 3.23388671875, 4.083984375, 4.93408203125, 5.7841796875, 6.63427734375, 7.484375, 8.33447265625, 9.1845703125, 10.03466796875, 10.884765625, 11.73486328125, 12.5849609375, 13.43505859375, 14.28515625, 15.13525390625, 15.9853515625, 16.83544921875, 17.685546875, 18.53564453125, 19.3857421875, 20.23583984375, 21.0859375, 21.93603515625, 22.7861328125, 23.63623046875, 24.486328125, 25.33642578125, 26.1865234375, 27.03662109375, 27.88671875, 28.73681640625, 29.5869140625, 30.43701171875, 31.287109375, 32.13720703125, 32.9873046875, 33.83740234375, 34.6875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 24.0, 178.0, 529.0, 251.0, 31.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.37868881225586, -55.20637512207031, -50.03406524658203, -44.861751556396484, -39.68943786621094, -34.517127990722656, -29.34481430053711, -24.172504425048828, -19.00019073486328, -13.827878952026367, -8.655566215515137, -3.4832534790039062, 1.6890583038330078, 6.861370086669922, 12.033683776855469, 17.20599365234375, 22.378307342529297, 27.55061912536621, 32.722930908203125, 37.89524459838867, 43.06755828857422, 48.2398681640625, 53.41218185424805, 58.58449172973633, 63.756805419921875, 68.92911529541016, 74.10143280029297, 79.27374267578125, 84.44605255126953, 89.61836242675781, 94.79067993164062, 99.9629898071289, 105.13529968261719, 110.30760955810547, 115.47992706298828, 120.65223693847656, 125.82454681396484, 130.99685668945312, 136.16917419433594, 141.34149169921875, 146.5137939453125, 151.6861114501953, 156.85841369628906, 162.03073120117188, 167.2030487060547, 172.37535095214844, 177.54766845703125, 182.719970703125, 187.89230346679688, 193.0646209716797, 198.23692321777344, 203.40924072265625, 208.58155822753906, 213.7538604736328, 218.92617797851562, 224.09848022460938, 229.2707977294922, 234.443115234375, 239.61541748046875, 244.78773498535156, 249.96005249023438, 255.13235473632812, 260.3046875, 265.47698974609375, 270.6492919921875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 6.0, 8.0, 6.0, 12.0, 10.0, 18.0, 13.0, 25.0, 25.0, 31.0, 24.0, 29.0, 30.0, 33.0, 29.0, 24.0, 42.0, 43.0, 41.0, 53.0, 36.0, 38.0, 36.0, 45.0, 26.0, 45.0, 29.0, 26.0, 35.0, 25.0, 24.0, 23.0, 12.0, 24.0, 10.0, 10.0, 12.0, 10.0, 11.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.33553695678711, -28.34575843811035, -27.355981826782227, -26.36620330810547, -25.37642478942871, -24.386646270751953, -23.396869659423828, -22.40709114074707, -21.417312622070312, -20.427534103393555, -19.43775749206543, -18.447978973388672, -17.458200454711914, -16.468421936035156, -15.478645324707031, -14.488866806030273, -13.499089241027832, -12.50931167602539, -11.519533157348633, -10.529755592346191, -9.539977073669434, -8.550199508666992, -7.560421466827393, -6.570643424987793, -5.580865383148193, -4.591087341308594, -3.601309299468994, -2.6115314960479736, -1.621753454208374, -0.6319756507873535, 0.3578023910522461, 1.3475804328918457, 2.3373584747314453, 3.327136516571045, 4.3169145584106445, 5.306692123413086, 6.296470642089844, 7.286248207092285, 8.276025772094727, 9.265804290771484, 10.255582809448242, 11.245360374450684, 12.235138893127441, 13.224916458129883, 14.21469497680664, 15.204472541809082, 16.194250106811523, 17.18402862548828, 18.173805236816406, 19.163583755493164, 20.15336036682129, 21.143138885498047, 22.132917404174805, 23.122695922851562, 24.112472534179688, 25.102251052856445, 26.092029571533203, 27.08180809020996, 28.071584701538086, 29.061363220214844, 30.0511417388916, 31.04092025756836, 32.030696868896484, 33.020477294921875, 34.01025390625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 3.0, 12.0, 9.0, 13.0, 9.0, 11.0, 12.0, 27.0, 31.0, 23.0, 16.0, 31.0, 32.0, 37.0, 29.0, 34.0, 27.0, 39.0, 25.0, 45.0, 47.0, 42.0, 43.0, 37.0, 41.0, 31.0, 22.0, 33.0, 26.0, 23.0, 28.0, 21.0, 11.0, 19.0, 10.0, 17.0, 12.0, 9.0, 13.0, 3.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-2.578125, -2.500579833984375, -2.42303466796875, -2.345489501953125, -2.2679443359375, -2.190399169921875, -2.11285400390625, -2.035308837890625, -1.957763671875, -1.880218505859375, -1.80267333984375, -1.725128173828125, -1.6475830078125, -1.570037841796875, -1.49249267578125, -1.414947509765625, -1.33740234375, -1.259857177734375, -1.18231201171875, -1.104766845703125, -1.0272216796875, -0.949676513671875, -0.87213134765625, -0.794586181640625, -0.717041015625, -0.639495849609375, -0.56195068359375, -0.484405517578125, -0.4068603515625, -0.329315185546875, -0.25177001953125, -0.174224853515625, -0.0966796875, -0.019134521484375, 0.05841064453125, 0.135955810546875, 0.2135009765625, 0.291046142578125, 0.36859130859375, 0.446136474609375, 0.523681640625, 0.601226806640625, 0.67877197265625, 0.756317138671875, 0.8338623046875, 0.911407470703125, 0.98895263671875, 1.066497802734375, 1.14404296875, 1.221588134765625, 1.29913330078125, 1.376678466796875, 1.4542236328125, 1.531768798828125, 1.60931396484375, 1.686859130859375, 1.764404296875, 1.841949462890625, 1.91949462890625, 1.997039794921875, 2.0745849609375, 2.152130126953125, 2.22967529296875, 2.307220458984375, 2.384765625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 6.0, 12.0, 13.0, 26.0, 26.0, 36.0, 83.0, 96.0, 145.0, 209.0, 287.0, 453.0, 651.0, 985.0, 1444.0, 2042.0, 3081.0, 4474.0, 6737.0, 10196.0, 15216.0, 22400.0, 34304.0, 52072.0, 80125.0, 123075.0, 172778.0, 169600.0, 119417.0, 77822.0, 50672.0, 33179.0, 22225.0, 14690.0, 9617.0, 6713.0, 4373.0, 3033.0, 1977.0, 1364.0, 924.0, 628.0, 440.0, 290.0, 203.0, 127.0, 101.0, 68.0, 39.0, 33.0, 16.0, 9.0, 10.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1778564453125, -0.1719207763671875, -0.165985107421875, -0.1600494384765625, -0.15411376953125, -0.1481781005859375, -0.142242431640625, -0.1363067626953125, -0.13037109375, -0.1244354248046875, -0.118499755859375, -0.1125640869140625, -0.10662841796875, -0.1006927490234375, -0.094757080078125, -0.0888214111328125, -0.0828857421875, -0.0769500732421875, -0.071014404296875, -0.0650787353515625, -0.05914306640625, -0.0532073974609375, -0.047271728515625, -0.0413360595703125, -0.035400390625, -0.0294647216796875, -0.023529052734375, -0.0175933837890625, -0.01165771484375, -0.0057220458984375, 0.000213623046875, 0.0061492919921875, 0.0120849609375, 0.0180206298828125, 0.023956298828125, 0.0298919677734375, 0.03582763671875, 0.0417633056640625, 0.047698974609375, 0.0536346435546875, 0.0595703125, 0.0655059814453125, 0.071441650390625, 0.0773773193359375, 0.08331298828125, 0.0892486572265625, 0.095184326171875, 0.1011199951171875, 0.1070556640625, 0.1129913330078125, 0.118927001953125, 0.1248626708984375, 0.13079833984375, 0.1367340087890625, 0.142669677734375, 0.1486053466796875, 0.154541015625, 0.1604766845703125, 0.166412353515625, 0.1723480224609375, 0.17828369140625, 0.1842193603515625, 0.190155029296875, 0.1960906982421875, 0.2020263671875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 6.0, 13.0, 12.0, 8.0, 20.0, 22.0, 16.0, 24.0, 26.0, 30.0, 36.0, 40.0, 37.0, 42.0, 41.0, 43.0, 37.0, 1077.0, 43.0, 50.0, 36.0, 35.0, 44.0, 30.0, 48.0, 35.0, 37.0, 26.0, 28.0, 14.0, 10.0, 10.0, 16.0, 11.0, 5.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.05859375, -1.99847412109375, -1.9383544921875, -1.87823486328125, -1.818115234375, -1.75799560546875, -1.6978759765625, -1.63775634765625, -1.57763671875, -1.51751708984375, -1.4573974609375, -1.39727783203125, -1.337158203125, -1.27703857421875, -1.2169189453125, -1.15679931640625, -1.0966796875, -1.03656005859375, -0.9764404296875, -0.91632080078125, -0.856201171875, -0.79608154296875, -0.7359619140625, -0.67584228515625, -0.61572265625, -0.55560302734375, -0.4954833984375, -0.43536376953125, -0.375244140625, -0.31512451171875, -0.2550048828125, -0.19488525390625, -0.134765625, -0.07464599609375, -0.0145263671875, 0.04559326171875, 0.105712890625, 0.16583251953125, 0.2259521484375, 0.28607177734375, 0.34619140625, 0.40631103515625, 0.4664306640625, 0.52655029296875, 0.586669921875, 0.64678955078125, 0.7069091796875, 0.76702880859375, 0.8271484375, 0.88726806640625, 0.9473876953125, 1.00750732421875, 1.067626953125, 1.12774658203125, 1.1878662109375, 1.24798583984375, 1.30810546875, 1.36822509765625, 1.4283447265625, 1.48846435546875, 1.548583984375, 1.60870361328125, 1.6688232421875, 1.72894287109375, 1.7890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 12.0, 16.0, 20.0, 34.0, 49.0, 57.0, 75.0, 134.0, 204.0, 283.0, 418.0, 580.0, 940.0, 1322.0, 2040.0, 3087.0, 4834.0, 7391.0, 11676.0, 18656.0, 29371.0, 46772.0, 73751.0, 115592.0, 165012.0, 1228425.0, 137955.0, 90577.0, 57942.0, 36821.0, 22751.0, 14441.0, 8987.0, 5939.0, 3751.0, 2369.0, 1619.0, 1079.0, 650.0, 490.0, 328.0, 234.0, 136.0, 95.0, 73.0, 36.0, 31.0, 19.0, 19.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1707763671875, -0.16530799865722656, -0.15983963012695312, -0.1543712615966797, -0.14890289306640625, -0.1434345245361328, -0.13796615600585938, -0.13249778747558594, -0.1270294189453125, -0.12156105041503906, -0.11609268188476562, -0.11062431335449219, -0.10515594482421875, -0.09968757629394531, -0.09421920776367188, -0.08875083923339844, -0.083282470703125, -0.07781410217285156, -0.07234573364257812, -0.06687736511230469, -0.06140899658203125, -0.05594062805175781, -0.050472259521484375, -0.04500389099121094, -0.0395355224609375, -0.03406715393066406, -0.028598785400390625, -0.023130416870117188, -0.01766204833984375, -0.012193679809570312, -0.006725311279296875, -0.0012569427490234375, 0.00421142578125, 0.009679794311523438, 0.015148162841796875, 0.020616531372070312, 0.02608489990234375, 0.03155326843261719, 0.037021636962890625, 0.04249000549316406, 0.0479583740234375, 0.05342674255371094, 0.058895111083984375, 0.06436347961425781, 0.06983184814453125, 0.07530021667480469, 0.08076858520507812, 0.08623695373535156, 0.091705322265625, 0.09717369079589844, 0.10264205932617188, 0.10811042785644531, 0.11357879638671875, 0.11904716491699219, 0.12451553344726562, 0.12998390197753906, 0.1354522705078125, 0.14092063903808594, 0.14638900756835938, 0.1518573760986328, 0.15732574462890625, 0.1627941131591797, 0.16826248168945312, 0.17373085021972656, 0.17919921875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 9.0, 13.0, 5.0, 8.0, 9.0, 9.0, 24.0, 19.0, 26.0, 39.0, 32.0, 33.0, 51.0, 60.0, 51.0, 75.0, 71.0, 68.0, 51.0, 61.0, 43.0, 39.0, 39.0, 28.0, 23.0, 19.0, 19.0, 16.0, 9.0, 13.0, 9.0, 7.0, 2.0, 0.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006823539733886719, -0.0006617531180381775, -0.0006411522626876831, -0.0006205514073371887, -0.0005999505519866943, -0.0005793496966362, -0.0005587488412857056, -0.0005381479859352112, -0.0005175471305847168, -0.0004969462752342224, -0.00047634541988372803, -0.00045574456453323364, -0.00043514370918273926, -0.0004145428538322449, -0.0003939419984817505, -0.0003733411431312561, -0.0003527402877807617, -0.00033213943243026733, -0.00031153857707977295, -0.00029093772172927856, -0.0002703368663787842, -0.0002497360110282898, -0.0002291351556777954, -0.00020853430032730103, -0.00018793344497680664, -0.00016733258962631226, -0.00014673173427581787, -0.00012613087892532349, -0.0001055300235748291, -8.492916822433472e-05, -6.432831287384033e-05, -4.372745752334595e-05, -2.3126602172851562e-05, -2.5257468223571777e-06, 1.8075108528137207e-05, 3.867596387863159e-05, 5.9276819229125977e-05, 7.987767457962036e-05, 0.00010047852993011475, 0.00012107938528060913, 0.00014168024063110352, 0.0001622810959815979, 0.00018288195133209229, 0.00020348280668258667, 0.00022408366203308105, 0.00024468451738357544, 0.0002652853727340698, 0.0002858862280845642, 0.0003064870834350586, 0.000327087938785553, 0.00034768879413604736, 0.00036828964948654175, 0.00038889050483703613, 0.0004094913601875305, 0.0004300922155380249, 0.0004506930708885193, 0.00047129392623901367, 0.0004918947815895081, 0.0005124956369400024, 0.0005330964922904968, 0.0005536973476409912, 0.0005742982029914856, 0.00059489905834198, 0.0006154999136924744, 0.0006361007690429688]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 2.0, 3.0, 4.0, 8.0, 4.0, 12.0, 16.0, 17.0, 28.0, 39.0, 32.0, 33.0, 39.0, 40.0, 60.0, 70.0, 94.0, 122.0, 142.0, 220.0, 388.0, 715.0, 12120.0, 1010937.0, 21079.0, 820.0, 411.0, 250.0, 165.0, 139.0, 109.0, 91.0, 56.0, 59.0, 45.0, 26.0, 45.0, 21.0, 15.0, 15.0, 12.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.01049041748046875, -0.010168075561523438, -0.009845733642578125, -0.009523391723632812, -0.0092010498046875, -0.008878707885742188, -0.008556365966796875, -0.008234024047851562, -0.00791168212890625, -0.0075893402099609375, -0.007266998291015625, -0.0069446563720703125, -0.006622314453125, -0.0062999725341796875, -0.005977630615234375, -0.0056552886962890625, -0.00533294677734375, -0.0050106048583984375, -0.004688262939453125, -0.0043659210205078125, -0.0040435791015625, -0.0037212371826171875, -0.003398895263671875, -0.0030765533447265625, -0.00275421142578125, -0.0024318695068359375, -0.002109527587890625, -0.0017871856689453125, -0.00146484375, -0.0011425018310546875, -0.000820159912109375, -0.0004978179931640625, -0.00017547607421875, 0.0001468658447265625, 0.000469207763671875, 0.0007915496826171875, 0.0011138916015625, 0.0014362335205078125, 0.001758575439453125, 0.0020809173583984375, 0.00240325927734375, 0.0027256011962890625, 0.003047943115234375, 0.0033702850341796875, 0.003692626953125, 0.0040149688720703125, 0.004337310791015625, 0.0046596527099609375, 0.00498199462890625, 0.0053043365478515625, 0.005626678466796875, 0.0059490203857421875, 0.0062713623046875, 0.0065937042236328125, 0.006916046142578125, 0.0072383880615234375, 0.00756072998046875, 0.007883071899414062, 0.008205413818359375, 0.008527755737304688, 0.00885009765625, 0.009172439575195312, 0.009494781494140625, 0.009817123413085938, 0.01013946533203125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 63.0, 516.0, 403.0, 28.0, 3.0], "bins": [-0.004223145544528961, -0.004153778776526451, -0.004084412008523941, -0.004015045240521431, -0.003945678472518921, -0.003876311471685767, -0.003806944703683257, -0.0037375777028501034, -0.0036682109348475933, -0.0035988441668450832, -0.003529477398842573, -0.0034601103980094194, -0.0033907436300069094, -0.0033213768620043993, -0.0032520100940018892, -0.0031826430931687355, -0.0031132763251662254, -0.0030439095571637154, -0.0029745427891612053, -0.0029051757883280516, -0.0028358090203255415, -0.0027664422523230314, -0.0026970754843205214, -0.0026277084834873676, -0.002558341948315501, -0.002488975180312991, -0.002419608412310481, -0.0023502414114773273, -0.0022808746434748173, -0.002211507875472307, -0.002142141107469797, -0.002072774339467287, -0.0020034073386341333, -0.0019340405706316233, -0.0018646736862137914, -0.0017953069182112813, -0.0017259400337934494, -0.0016565732657909393, -0.0015872064977884293, -0.0015178396133705974, -0.0014484727289527655, -0.0013791059609502554, -0.0013097390765324235, -0.0012403723085299134, -0.0011710054241120815, -0.0011016386561095715, -0.0010322718881070614, -0.0009629050036892295, -0.0008935381192713976, -0.0008241712930612266, -0.0007548044668510556, -0.0006854376988485456, -0.0006160708144307137, -0.0005467040464282036, -0.0004773372202180326, -0.0004079703940078616, -0.00033860356779769063, -0.00026923674158751965, -0.0001998699299292639, -0.00013050311827100813, -6.113629206083715e-05, 8.230534149333835e-06, 7.759733125567436e-05, 0.00014696415746584535, 0.0002163309691241011]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 19.0, 18.0, 25.0, 22.0, 17.0, 23.0, 28.0, 19.0, 28.0, 33.0, 26.0, 39.0, 44.0, 45.0, 44.0, 38.0, 43.0, 26.0, 48.0, 46.0, 36.0, 38.0, 31.0, 31.0, 26.0, 23.0, 26.0, 24.0, 17.0, 21.0, 17.0, 15.0, 11.0, 9.0, 8.0, 4.0, 7.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0003572702407836914, -0.0003469865769147873, -0.0003367029130458832, -0.00032641924917697906, -0.00031613558530807495, -0.00030585192143917084, -0.0002955682575702667, -0.0002852845937013626, -0.0002750009298324585, -0.0002647172659635544, -0.00025443360209465027, -0.00024414993822574615, -0.00023386627435684204, -0.00022358261048793793, -0.0002132989466190338, -0.0002030152827501297, -0.00019273161888122559, -0.00018244795501232147, -0.00017216429114341736, -0.00016188062727451324, -0.00015159696340560913, -0.00014131329953670502, -0.0001310296356678009, -0.00012074597179889679, -0.00011046230792999268, -0.00010017864406108856, -8.989498019218445e-05, -7.961131632328033e-05, -6.932765245437622e-05, -5.904398858547211e-05, -4.876032471656799e-05, -3.847666084766388e-05, -2.8192996978759766e-05, -1.7909333109855652e-05, -7.625669240951538e-06, 2.6579946279525757e-06, 1.294165849685669e-05, 2.3225322365760803e-05, 3.350898623466492e-05, 4.379265010356903e-05, 5.4076313972473145e-05, 6.435997784137726e-05, 7.464364171028137e-05, 8.492730557918549e-05, 9.52109694480896e-05, 0.00010549463331699371, 0.00011577829718589783, 0.00012606196105480194, 0.00013634562492370605, 0.00014662928879261017, 0.00015691295266151428, 0.0001671966165304184, 0.0001774802803993225, 0.00018776394426822662, 0.00019804760813713074, 0.00020833127200603485, 0.00021861493587493896, 0.00022889859974384308, 0.0002391822636127472, 0.0002494659274816513, 0.0002597495913505554, 0.00027003325521945953, 0.00028031691908836365, 0.00029060058295726776, 0.0003008842468261719]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 3.0, 12.0, 9.0, 13.0, 9.0, 11.0, 12.0, 27.0, 31.0, 23.0, 16.0, 31.0, 32.0, 37.0, 29.0, 34.0, 27.0, 39.0, 25.0, 45.0, 47.0, 42.0, 43.0, 37.0, 41.0, 31.0, 22.0, 33.0, 26.0, 23.0, 28.0, 21.0, 11.0, 19.0, 10.0, 17.0, 12.0, 9.0, 13.0, 3.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-2.578125, -2.500579833984375, -2.42303466796875, -2.345489501953125, -2.2679443359375, -2.190399169921875, -2.11285400390625, -2.035308837890625, -1.957763671875, -1.880218505859375, -1.80267333984375, -1.725128173828125, -1.6475830078125, -1.570037841796875, -1.49249267578125, -1.414947509765625, -1.33740234375, -1.259857177734375, -1.18231201171875, -1.104766845703125, -1.0272216796875, -0.949676513671875, -0.87213134765625, -0.794586181640625, -0.717041015625, -0.639495849609375, -0.56195068359375, -0.484405517578125, -0.4068603515625, -0.329315185546875, -0.25177001953125, -0.174224853515625, -0.0966796875, -0.019134521484375, 0.05841064453125, 0.135955810546875, 0.2135009765625, 0.291046142578125, 0.36859130859375, 0.446136474609375, 0.523681640625, 0.601226806640625, 0.67877197265625, 0.756317138671875, 0.8338623046875, 0.911407470703125, 0.98895263671875, 1.066497802734375, 1.14404296875, 1.221588134765625, 1.29913330078125, 1.376678466796875, 1.4542236328125, 1.531768798828125, 1.60931396484375, 1.686859130859375, 1.764404296875, 1.841949462890625, 1.91949462890625, 1.997039794921875, 2.0745849609375, 2.152130126953125, 2.22967529296875, 2.307220458984375, 2.384765625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 15.0, 18.0, 24.0, 21.0, 30.0, 52.0, 70.0, 101.0, 131.0, 202.0, 269.0, 395.0, 617.0, 1141.0, 2240.0, 4461.0, 10154.0, 23990.0, 60426.0, 144013.0, 266518.0, 272482.0, 150818.0, 64065.0, 25538.0, 10519.0, 4709.0, 2251.0, 1172.0, 704.0, 418.0, 281.0, 201.0, 152.0, 95.0, 72.0, 51.0, 39.0, 27.0, 19.0, 13.0, 7.0, 7.0, 7.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.08203125, -2.985809326171875, -2.88958740234375, -2.793365478515625, -2.6971435546875, -2.600921630859375, -2.50469970703125, -2.408477783203125, -2.312255859375, -2.216033935546875, -2.11981201171875, -2.023590087890625, -1.9273681640625, -1.831146240234375, -1.73492431640625, -1.638702392578125, -1.54248046875, -1.446258544921875, -1.35003662109375, -1.253814697265625, -1.1575927734375, -1.061370849609375, -0.96514892578125, -0.868927001953125, -0.772705078125, -0.676483154296875, -0.58026123046875, -0.484039306640625, -0.3878173828125, -0.291595458984375, -0.19537353515625, -0.099151611328125, -0.0029296875, 0.093292236328125, 0.18951416015625, 0.285736083984375, 0.3819580078125, 0.478179931640625, 0.57440185546875, 0.670623779296875, 0.766845703125, 0.863067626953125, 0.95928955078125, 1.055511474609375, 1.1517333984375, 1.247955322265625, 1.34417724609375, 1.440399169921875, 1.53662109375, 1.632843017578125, 1.72906494140625, 1.825286865234375, 1.9215087890625, 2.017730712890625, 2.11395263671875, 2.210174560546875, 2.306396484375, 2.402618408203125, 2.49884033203125, 2.595062255859375, 2.6912841796875, 2.787506103515625, 2.88372802734375, 2.979949951171875, 3.076171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 1.0, 15.0, 6.0, 8.0, 8.0, 14.0, 17.0, 23.0, 30.0, 22.0, 22.0, 26.0, 28.0, 35.0, 39.0, 57.0, 45.0, 108.0, 207.0, 1361.0, 286.0, 152.0, 112.0, 75.0, 49.0, 34.0, 36.0, 33.0, 26.0, 35.0, 16.0, 22.0, 14.0, 12.0, 19.0, 10.0, 7.0, 5.0, 6.0, 6.0, 9.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.3834228515625, -9.079345703125, -8.7752685546875, -8.47119140625, -8.1671142578125, -7.863037109375, -7.5589599609375, -7.2548828125, -6.9508056640625, -6.646728515625, -6.3426513671875, -6.03857421875, -5.7344970703125, -5.430419921875, -5.1263427734375, -4.822265625, -4.5181884765625, -4.214111328125, -3.9100341796875, -3.60595703125, -3.3018798828125, -2.997802734375, -2.6937255859375, -2.3896484375, -2.0855712890625, -1.781494140625, -1.4774169921875, -1.17333984375, -0.8692626953125, -0.565185546875, -0.2611083984375, 0.04296875, 0.3470458984375, 0.651123046875, 0.9552001953125, 1.25927734375, 1.5633544921875, 1.867431640625, 2.1715087890625, 2.4755859375, 2.7796630859375, 3.083740234375, 3.3878173828125, 3.69189453125, 3.9959716796875, 4.300048828125, 4.6041259765625, 4.908203125, 5.2122802734375, 5.516357421875, 5.8204345703125, 6.12451171875, 6.4285888671875, 6.732666015625, 7.0367431640625, 7.3408203125, 7.6448974609375, 7.948974609375, 8.2530517578125, 8.55712890625, 8.8612060546875, 9.165283203125, 9.4693603515625, 9.7734375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 6.0, 8.0, 8.0, 6.0, 9.0, 13.0, 13.0, 19.0, 18.0, 26.0, 28.0, 43.0, 56.0, 80.0, 114.0, 180.0, 379.0, 994.0, 5638.0, 416284.0, 2701339.0, 17508.0, 1674.0, 517.0, 251.0, 135.0, 79.0, 50.0, 40.0, 21.0, 31.0, 22.0, 23.0, 20.0, 16.0, 14.0, 7.0, 6.0, 8.0, 9.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.546875, -19.88818359375, -19.2294921875, -18.57080078125, -17.912109375, -17.25341796875, -16.5947265625, -15.93603515625, -15.27734375, -14.61865234375, -13.9599609375, -13.30126953125, -12.642578125, -11.98388671875, -11.3251953125, -10.66650390625, -10.0078125, -9.34912109375, -8.6904296875, -8.03173828125, -7.373046875, -6.71435546875, -6.0556640625, -5.39697265625, -4.73828125, -4.07958984375, -3.4208984375, -2.76220703125, -2.103515625, -1.44482421875, -0.7861328125, -0.12744140625, 0.53125, 1.18994140625, 1.8486328125, 2.50732421875, 3.166015625, 3.82470703125, 4.4833984375, 5.14208984375, 5.80078125, 6.45947265625, 7.1181640625, 7.77685546875, 8.435546875, 9.09423828125, 9.7529296875, 10.41162109375, 11.0703125, 11.72900390625, 12.3876953125, 13.04638671875, 13.705078125, 14.36376953125, 15.0224609375, 15.68115234375, 16.33984375, 16.99853515625, 17.6572265625, 18.31591796875, 18.974609375, 19.63330078125, 20.2919921875, 20.95068359375, 21.609375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 28.0, 187.0, 468.0, 259.0, 61.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.43870162963867, -55.869876861572266, -54.30105209350586, -52.73222732543945, -51.16339874267578, -49.594573974609375, -48.02574920654297, -46.45692443847656, -44.888099670410156, -43.31927490234375, -41.750450134277344, -40.18162536621094, -38.61280059814453, -37.04397201538086, -35.47514724731445, -33.90632247924805, -32.33749771118164, -30.768672943115234, -29.199848175048828, -27.63102149963379, -26.062196731567383, -24.493371963500977, -22.924545288085938, -21.35572052001953, -19.786895751953125, -18.21807098388672, -16.649246215820312, -15.080419540405273, -13.511594772338867, -11.942770004272461, -10.373944282531738, -8.805118560791016, -7.236293792724609, -5.667468547821045, -4.0986433029174805, -2.529818058013916, -0.9609928131103516, 0.6078324317932129, 2.1766576766967773, 3.7454833984375, 5.314308166503906, 6.883133411407471, 8.451958656311035, 10.020784378051758, 11.589609146118164, 13.15843391418457, 14.727259635925293, 16.296085357666016, 17.864910125732422, 19.433734893798828, 21.002559661865234, 22.571386337280273, 24.14021110534668, 25.709035873413086, 27.277862548828125, 28.84668731689453, 30.415512084960938, 31.984336853027344, 33.55316162109375, 35.121986389160156, 36.69081115722656, 38.259639739990234, 39.82846450805664, 41.39728927612305, 42.96611404418945]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 3.0, 7.0, 11.0, 10.0, 10.0, 7.0, 23.0, 26.0, 23.0, 23.0, 28.0, 32.0, 17.0, 23.0, 29.0, 33.0, 59.0, 42.0, 51.0, 31.0, 39.0, 29.0, 39.0, 24.0, 42.0, 28.0, 26.0, 35.0, 33.0, 37.0, 30.0, 19.0, 19.0, 19.0, 8.0, 15.0, 15.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-30.044788360595703, -29.11012077331543, -28.175453186035156, -27.240785598754883, -26.30611801147461, -25.371450424194336, -24.436782836914062, -23.50211524963379, -22.567447662353516, -21.632780075073242, -20.69811248779297, -19.763444900512695, -18.828777313232422, -17.89410972595215, -16.959442138671875, -16.0247745513916, -15.090106964111328, -14.155439376831055, -13.220771789550781, -12.286104202270508, -11.351436614990234, -10.416769027709961, -9.482101440429688, -8.547433853149414, -7.612766265869141, -6.678098678588867, -5.743431091308594, -4.80876350402832, -3.874095916748047, -2.9394283294677734, -2.0047607421875, -1.0700931549072266, -0.13542556762695312, 0.7992420196533203, 1.7339096069335938, 2.668577194213867, 3.6032447814941406, 4.537912368774414, 5.4725799560546875, 6.407247543334961, 7.341915130615234, 8.276582717895508, 9.211250305175781, 10.145917892456055, 11.080585479736328, 12.015253067016602, 12.949920654296875, 13.884588241577148, 14.819255828857422, 15.753923416137695, 16.68859100341797, 17.623258590698242, 18.557926177978516, 19.49259376525879, 20.427261352539062, 21.361928939819336, 22.29659652709961, 23.231264114379883, 24.165931701660156, 25.10059928894043, 26.035266876220703, 26.969934463500977, 27.90460205078125, 28.839269638061523, 29.773937225341797]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 7.0, 7.0, 4.0, 9.0, 6.0, 14.0, 7.0, 19.0, 15.0, 17.0, 24.0, 19.0, 22.0, 28.0, 24.0, 31.0, 33.0, 22.0, 39.0, 30.0, 35.0, 35.0, 43.0, 31.0, 51.0, 36.0, 41.0, 38.0, 29.0, 30.0, 30.0, 29.0, 24.0, 24.0, 17.0, 16.0, 15.0, 22.0, 14.0, 12.0, 8.0, 6.0, 7.0, 4.0, 3.0, 5.0, 6.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-2.63671875, -2.55706787109375, -2.4774169921875, -2.39776611328125, -2.318115234375, -2.23846435546875, -2.1588134765625, -2.07916259765625, -1.99951171875, -1.91986083984375, -1.8402099609375, -1.76055908203125, -1.680908203125, -1.60125732421875, -1.5216064453125, -1.44195556640625, -1.3623046875, -1.28265380859375, -1.2030029296875, -1.12335205078125, -1.043701171875, -0.96405029296875, -0.8843994140625, -0.80474853515625, -0.72509765625, -0.64544677734375, -0.5657958984375, -0.48614501953125, -0.406494140625, -0.32684326171875, -0.2471923828125, -0.16754150390625, -0.087890625, -0.00823974609375, 0.0714111328125, 0.15106201171875, 0.230712890625, 0.31036376953125, 0.3900146484375, 0.46966552734375, 0.54931640625, 0.62896728515625, 0.7086181640625, 0.78826904296875, 0.867919921875, 0.94757080078125, 1.0272216796875, 1.10687255859375, 1.1865234375, 1.26617431640625, 1.3458251953125, 1.42547607421875, 1.505126953125, 1.58477783203125, 1.6644287109375, 1.74407958984375, 1.82373046875, 1.90338134765625, 1.9830322265625, 2.06268310546875, 2.142333984375, 2.22198486328125, 2.3016357421875, 2.38128662109375, 2.4609375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 9.0, 6.0, 7.0, 11.0, 16.0, 18.0, 22.0, 30.0, 34.0, 39.0, 56.0, 68.0, 97.0, 205.0, 355.0, 856.0, 2490.0, 9780.0, 58993.0, 555934.0, 2787277.0, 691813.0, 70241.0, 11276.0, 2668.0, 966.0, 378.0, 181.0, 114.0, 69.0, 46.0, 41.0, 41.0, 24.0, 19.0, 21.0, 22.0, 13.0, 11.0, 14.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-10.8515625, -10.5462646484375, -10.240966796875, -9.9356689453125, -9.63037109375, -9.3250732421875, -9.019775390625, -8.7144775390625, -8.4091796875, -8.1038818359375, -7.798583984375, -7.4932861328125, -7.18798828125, -6.8826904296875, -6.577392578125, -6.2720947265625, -5.966796875, -5.6614990234375, -5.356201171875, -5.0509033203125, -4.74560546875, -4.4403076171875, -4.135009765625, -3.8297119140625, -3.5244140625, -3.2191162109375, -2.913818359375, -2.6085205078125, -2.30322265625, -1.9979248046875, -1.692626953125, -1.3873291015625, -1.08203125, -0.7767333984375, -0.471435546875, -0.1661376953125, 0.13916015625, 0.4444580078125, 0.749755859375, 1.0550537109375, 1.3603515625, 1.6656494140625, 1.970947265625, 2.2762451171875, 2.58154296875, 2.8868408203125, 3.192138671875, 3.4974365234375, 3.802734375, 4.1080322265625, 4.413330078125, 4.7186279296875, 5.02392578125, 5.3292236328125, 5.634521484375, 5.9398193359375, 6.2451171875, 6.5504150390625, 6.855712890625, 7.1610107421875, 7.46630859375, 7.7716064453125, 8.076904296875, 8.3822021484375, 8.6875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 1.0, 8.0, 10.0, 12.0, 20.0, 27.0, 44.0, 56.0, 77.0, 119.0, 138.0, 186.0, 271.0, 372.0, 459.0, 450.0, 458.0, 389.0, 267.0, 186.0, 136.0, 103.0, 89.0, 54.0, 46.0, 39.0, 21.0, 11.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.375, -12.0531005859375, -11.731201171875, -11.4093017578125, -11.08740234375, -10.7655029296875, -10.443603515625, -10.1217041015625, -9.7998046875, -9.4779052734375, -9.156005859375, -8.8341064453125, -8.51220703125, -8.1903076171875, -7.868408203125, -7.5465087890625, -7.224609375, -6.9027099609375, -6.580810546875, -6.2589111328125, -5.93701171875, -5.6151123046875, -5.293212890625, -4.9713134765625, -4.6494140625, -4.3275146484375, -4.005615234375, -3.6837158203125, -3.36181640625, -3.0399169921875, -2.718017578125, -2.3961181640625, -2.07421875, -1.7523193359375, -1.430419921875, -1.1085205078125, -0.78662109375, -0.4647216796875, -0.142822265625, 0.1790771484375, 0.5009765625, 0.8228759765625, 1.144775390625, 1.4666748046875, 1.78857421875, 2.1104736328125, 2.432373046875, 2.7542724609375, 3.076171875, 3.3980712890625, 3.719970703125, 4.0418701171875, 4.36376953125, 4.6856689453125, 5.007568359375, 5.3294677734375, 5.6513671875, 5.9732666015625, 6.295166015625, 6.6170654296875, 6.93896484375, 7.2608642578125, 7.582763671875, 7.9046630859375, 8.2265625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 16.0, 11.0, 26.0, 36.0, 63.0, 97.0, 221.0, 346.0, 787.0, 2109.0, 11850.0, 175439.0, 3002515.0, 950736.0, 43151.0, 4410.0, 1320.0, 536.0, 263.0, 131.0, 77.0, 63.0, 28.0, 14.0, 15.0, 6.0, 3.0, 6.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.861572265625, -18.12939453125, -17.397216796875, -16.6650390625, -15.932861328125, -15.20068359375, -14.468505859375, -13.736328125, -13.004150390625, -12.27197265625, -11.539794921875, -10.8076171875, -10.075439453125, -9.34326171875, -8.611083984375, -7.87890625, -7.146728515625, -6.41455078125, -5.682373046875, -4.9501953125, -4.218017578125, -3.48583984375, -2.753662109375, -2.021484375, -1.289306640625, -0.55712890625, 0.175048828125, 0.9072265625, 1.639404296875, 2.37158203125, 3.103759765625, 3.8359375, 4.568115234375, 5.30029296875, 6.032470703125, 6.7646484375, 7.496826171875, 8.22900390625, 8.961181640625, 9.693359375, 10.425537109375, 11.15771484375, 11.889892578125, 12.6220703125, 13.354248046875, 14.08642578125, 14.818603515625, 15.55078125, 16.282958984375, 17.01513671875, 17.747314453125, 18.4794921875, 19.211669921875, 19.94384765625, 20.676025390625, 21.408203125, 22.140380859375, 22.87255859375, 23.604736328125, 24.3369140625, 25.069091796875, 25.80126953125, 26.533447265625, 27.265625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 13.0, 21.0, 34.0, 74.0, 97.0, 139.0, 169.0, 143.0, 131.0, 76.0, 64.0, 28.0, 12.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-94.88855743408203, -93.08930206298828, -91.29005432128906, -89.49079895019531, -87.69154357910156, -85.89228820800781, -84.0930404663086, -82.29378509521484, -80.49453735351562, -78.69528198242188, -76.89603424072266, -75.0967788696289, -73.29752349853516, -71.49827575683594, -69.69902038574219, -67.89976501464844, -66.10050964355469, -64.30125427246094, -62.50200271606445, -60.70275115966797, -58.90349578857422, -57.104244232177734, -55.30499267578125, -53.5057373046875, -51.706485748291016, -49.90723419189453, -48.10797882080078, -46.3087272644043, -44.50947570800781, -42.71022033691406, -40.91096878051758, -39.111717224121094, -37.312461853027344, -35.51321029663086, -33.71395492553711, -31.914703369140625, -30.115449905395508, -28.31619644165039, -26.516944885253906, -24.71769142150879, -22.91843605041504, -21.119182586669922, -19.319931030273438, -17.52067756652832, -15.721424102783203, -13.922170639038086, -12.122918128967285, -10.323665618896484, -8.524412155151367, -6.725159168243408, -4.925906181335449, -3.1266531944274902, -1.3274002075195312, 0.47185325622558594, 2.2711057662963867, 4.0703582763671875, 5.869611740112305, 7.668864727020264, 9.468117713928223, 11.267370223999023, 13.06662368774414, 14.865877151489258, 16.665130615234375, 18.46438217163086, 20.263635635375977]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 2.0, 9.0, 11.0, 7.0, 10.0, 16.0, 21.0, 23.0, 14.0, 34.0, 31.0, 33.0, 33.0, 49.0, 42.0, 34.0, 40.0, 42.0, 44.0, 49.0, 48.0, 45.0, 61.0, 36.0, 45.0, 31.0, 34.0, 26.0, 25.0, 16.0, 13.0, 11.0, 12.0, 12.0, 7.0, 11.0, 6.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.22817611694336, -35.15205764770508, -34.07594299316406, -32.99982452392578, -31.923709869384766, -30.847591400146484, -29.771474838256836, -28.695358276367188, -27.61924171447754, -26.54312515258789, -25.467008590698242, -24.390892028808594, -23.314773559570312, -22.238658905029297, -21.162540435791016, -20.086423873901367, -19.01030731201172, -17.93419075012207, -16.858074188232422, -15.781956672668457, -14.705840110778809, -13.62972354888916, -12.553606033325195, -11.477489471435547, -10.401372909545898, -9.32525634765625, -8.249139785766602, -7.173022270202637, -6.096905708312988, -5.02078914642334, -3.944672107696533, -2.8685550689697266, -1.7924346923828125, -0.716317892074585, 0.3597989082336426, 1.4359157085418701, 2.5120325088500977, 3.588149070739746, 4.664266109466553, 5.740383148193359, 6.816499710083008, 7.892616271972656, 8.968732833862305, 10.04485034942627, 11.120966911315918, 12.197083473205566, 13.273200988769531, 14.34931755065918, 15.425434112548828, 16.501550674438477, 17.577667236328125, 18.653783798217773, 19.729900360107422, 20.806018829345703, 21.88213539123535, 22.958251953125, 24.03436851501465, 25.110485076904297, 26.186601638793945, 27.262718200683594, 28.338836669921875, 29.41495132446289, 30.491069793701172, 31.56718635559082, 32.64330291748047]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 6.0, 7.0, 11.0, 11.0, 16.0, 10.0, 18.0, 20.0, 14.0, 26.0, 29.0, 38.0, 27.0, 33.0, 32.0, 36.0, 43.0, 40.0, 30.0, 48.0, 30.0, 51.0, 47.0, 30.0, 23.0, 35.0, 34.0, 25.0, 34.0, 20.0, 15.0, 17.0, 18.0, 10.0, 16.0, 15.0, 12.0, 6.0, 11.0, 15.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 6.0, 3.0], "bins": [-3.033203125, -2.9478759765625, -2.862548828125, -2.7772216796875, -2.69189453125, -2.6065673828125, -2.521240234375, -2.4359130859375, -2.3505859375, -2.2652587890625, -2.179931640625, -2.0946044921875, -2.00927734375, -1.9239501953125, -1.838623046875, -1.7532958984375, -1.66796875, -1.5826416015625, -1.497314453125, -1.4119873046875, -1.32666015625, -1.2413330078125, -1.156005859375, -1.0706787109375, -0.9853515625, -0.9000244140625, -0.814697265625, -0.7293701171875, -0.64404296875, -0.5587158203125, -0.473388671875, -0.3880615234375, -0.302734375, -0.2174072265625, -0.132080078125, -0.0467529296875, 0.03857421875, 0.1239013671875, 0.209228515625, 0.2945556640625, 0.3798828125, 0.4652099609375, 0.550537109375, 0.6358642578125, 0.72119140625, 0.8065185546875, 0.891845703125, 0.9771728515625, 1.0625, 1.1478271484375, 1.233154296875, 1.3184814453125, 1.40380859375, 1.4891357421875, 1.574462890625, 1.6597900390625, 1.7451171875, 1.8304443359375, 1.915771484375, 2.0010986328125, 2.08642578125, 2.1717529296875, 2.257080078125, 2.3424072265625, 2.427734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 11.0, 6.0, 6.0, 13.0, 14.0, 22.0, 38.0, 50.0, 88.0, 126.0, 195.0, 293.0, 400.0, 561.0, 844.0, 1280.0, 1888.0, 2699.0, 4042.0, 5897.0, 8733.0, 13083.0, 19707.0, 30710.0, 46931.0, 72198.0, 110736.0, 162771.0, 180899.0, 132650.0, 87331.0, 56157.0, 36448.0, 24038.0, 15645.0, 10310.0, 7097.0, 4680.0, 3007.0, 2153.0, 1570.0, 1040.0, 679.0, 504.0, 299.0, 200.0, 170.0, 124.0, 75.0, 55.0, 35.0, 19.0, 14.0, 14.0, 8.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.220458984375, -0.2138214111328125, -0.207183837890625, -0.2005462646484375, -0.19390869140625, -0.1872711181640625, -0.180633544921875, -0.1739959716796875, -0.1673583984375, -0.1607208251953125, -0.154083251953125, -0.1474456787109375, -0.14080810546875, -0.1341705322265625, -0.127532958984375, -0.1208953857421875, -0.1142578125, -0.1076202392578125, -0.100982666015625, -0.0943450927734375, -0.08770751953125, -0.0810699462890625, -0.074432373046875, -0.0677947998046875, -0.0611572265625, -0.0545196533203125, -0.047882080078125, -0.0412445068359375, -0.03460693359375, -0.0279693603515625, -0.021331787109375, -0.0146942138671875, -0.008056640625, -0.0014190673828125, 0.005218505859375, 0.0118560791015625, 0.01849365234375, 0.0251312255859375, 0.031768798828125, 0.0384063720703125, 0.0450439453125, 0.0516815185546875, 0.058319091796875, 0.0649566650390625, 0.07159423828125, 0.0782318115234375, 0.084869384765625, 0.0915069580078125, 0.09814453125, 0.1047821044921875, 0.111419677734375, 0.1180572509765625, 0.12469482421875, 0.1313323974609375, 0.137969970703125, 0.1446075439453125, 0.1512451171875, 0.1578826904296875, 0.164520263671875, 0.1711578369140625, 0.17779541015625, 0.1844329833984375, 0.191070556640625, 0.1977081298828125, 0.204345703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 3.0, 5.0, 5.0, 7.0, 8.0, 11.0, 11.0, 19.0, 22.0, 27.0, 24.0, 26.0, 20.0, 34.0, 29.0, 35.0, 35.0, 46.0, 32.0, 50.0, 45.0, 1070.0, 52.0, 41.0, 35.0, 34.0, 35.0, 28.0, 28.0, 20.0, 29.0, 21.0, 24.0, 18.0, 18.0, 15.0, 8.0, 8.0, 7.0, 8.0, 11.0, 9.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7548828125, -1.69659423828125, -1.6383056640625, -1.58001708984375, -1.521728515625, -1.46343994140625, -1.4051513671875, -1.34686279296875, -1.28857421875, -1.23028564453125, -1.1719970703125, -1.11370849609375, -1.055419921875, -0.99713134765625, -0.9388427734375, -0.88055419921875, -0.822265625, -0.76397705078125, -0.7056884765625, -0.64739990234375, -0.589111328125, -0.53082275390625, -0.4725341796875, -0.41424560546875, -0.35595703125, -0.29766845703125, -0.2393798828125, -0.18109130859375, -0.122802734375, -0.06451416015625, -0.0062255859375, 0.05206298828125, 0.1103515625, 0.16864013671875, 0.2269287109375, 0.28521728515625, 0.343505859375, 0.40179443359375, 0.4600830078125, 0.51837158203125, 0.57666015625, 0.63494873046875, 0.6932373046875, 0.75152587890625, 0.809814453125, 0.86810302734375, 0.9263916015625, 0.98468017578125, 1.04296875, 1.10125732421875, 1.1595458984375, 1.21783447265625, 1.276123046875, 1.33441162109375, 1.3927001953125, 1.45098876953125, 1.50927734375, 1.56756591796875, 1.6258544921875, 1.68414306640625, 1.742431640625, 1.80072021484375, 1.8590087890625, 1.91729736328125, 1.9755859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 19.0, 21.0, 19.0, 40.0, 63.0, 90.0, 153.0, 221.0, 402.0, 509.0, 908.0, 1292.0, 2249.0, 3454.0, 5686.0, 8675.0, 13959.0, 21910.0, 34166.0, 53562.0, 85984.0, 134467.0, 1235174.0, 174318.0, 117520.0, 74258.0, 46666.0, 29698.0, 18939.0, 11921.0, 7708.0, 4848.0, 3085.0, 1871.0, 1206.0, 763.0, 471.0, 306.0, 164.0, 124.0, 93.0, 38.0, 34.0, 29.0, 14.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1888427734375, -0.18272018432617188, -0.17659759521484375, -0.17047500610351562, -0.1643524169921875, -0.15822982788085938, -0.15210723876953125, -0.14598464965820312, -0.139862060546875, -0.13373947143554688, -0.12761688232421875, -0.12149429321289062, -0.1153717041015625, -0.10924911499023438, -0.10312652587890625, -0.09700393676757812, -0.09088134765625, -0.08475875854492188, -0.07863616943359375, -0.07251358032226562, -0.0663909912109375, -0.060268402099609375, -0.05414581298828125, -0.048023223876953125, -0.041900634765625, -0.035778045654296875, -0.02965545654296875, -0.023532867431640625, -0.0174102783203125, -0.011287689208984375, -0.00516510009765625, 0.000957489013671875, 0.007080078125, 0.013202667236328125, 0.01932525634765625, 0.025447845458984375, 0.0315704345703125, 0.037693023681640625, 0.04381561279296875, 0.049938201904296875, 0.056060791015625, 0.062183380126953125, 0.06830596923828125, 0.07442855834960938, 0.0805511474609375, 0.08667373657226562, 0.09279632568359375, 0.09891891479492188, 0.10504150390625, 0.11116409301757812, 0.11728668212890625, 0.12340927124023438, 0.1295318603515625, 0.13565444946289062, 0.14177703857421875, 0.14789962768554688, 0.154022216796875, 0.16014480590820312, 0.16626739501953125, 0.17238998413085938, 0.1785125732421875, 0.18463516235351562, 0.19075775146484375, 0.19688034057617188, 0.2030029296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 5.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 10.0, 7.0, 9.0, 12.0, 15.0, 17.0, 19.0, 21.0, 36.0, 44.0, 35.0, 45.0, 43.0, 34.0, 56.0, 59.0, 47.0, 68.0, 60.0, 55.0, 53.0, 47.0, 34.0, 33.0, 25.0, 21.0, 18.0, 17.0, 10.0, 5.0, 11.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006127357482910156, -0.0005902275443077087, -0.0005677193403244019, -0.000545211136341095, -0.0005227029323577881, -0.0005001947283744812, -0.0004776865243911743, -0.00045517832040786743, -0.00043267011642456055, -0.00041016191244125366, -0.0003876537084579468, -0.0003651455044746399, -0.000342637300491333, -0.0003201290965080261, -0.00029762089252471924, -0.00027511268854141235, -0.00025260448455810547, -0.00023009628057479858, -0.0002075880765914917, -0.00018507987260818481, -0.00016257166862487793, -0.00014006346464157104, -0.00011755526065826416, -9.504705667495728e-05, -7.253885269165039e-05, -5.0030648708343506e-05, -2.752244472503662e-05, -5.014240741729736e-06, 1.749396324157715e-05, 4.000216722488403e-05, 6.251037120819092e-05, 8.50185751914978e-05, 0.00010752677917480469, 0.00013003498315811157, 0.00015254318714141846, 0.00017505139112472534, 0.00019755959510803223, 0.0002200677990913391, 0.000242576003074646, 0.0002650842070579529, 0.00028759241104125977, 0.00031010061502456665, 0.00033260881900787354, 0.0003551170229911804, 0.0003776252269744873, 0.0004001334309577942, 0.0004226416349411011, 0.00044514983892440796, 0.00046765804290771484, 0.0004901662468910217, 0.0005126744508743286, 0.0005351826548576355, 0.0005576908588409424, 0.0005801990628242493, 0.0006027072668075562, 0.000625215470790863, 0.0006477236747741699, 0.0006702318787574768, 0.0006927400827407837, 0.0007152482867240906, 0.0007377564907073975, 0.0007602646946907043, 0.0007827728986740112, 0.0008052811026573181, 0.000827789306640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 6.0, 8.0, 14.0, 18.0, 13.0, 24.0, 41.0, 61.0, 60.0, 71.0, 89.0, 157.0, 186.0, 241.0, 440.0, 1230.0, 206226.0, 835366.0, 2643.0, 452.0, 324.0, 216.0, 145.0, 121.0, 97.0, 62.0, 45.0, 30.0, 34.0, 29.0, 17.0, 15.0, 16.0, 8.0, 7.0, 6.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.01371002197265625, -0.013308525085449219, -0.012907028198242188, -0.012505531311035156, -0.012104034423828125, -0.011702537536621094, -0.011301040649414062, -0.010899543762207031, -0.010498046875, -0.010096549987792969, -0.009695053100585938, -0.009293556213378906, -0.008892059326171875, -0.008490562438964844, -0.008089065551757812, -0.007687568664550781, -0.00728607177734375, -0.006884574890136719, -0.0064830780029296875, -0.006081581115722656, -0.005680084228515625, -0.005278587341308594, -0.0048770904541015625, -0.004475593566894531, -0.0040740966796875, -0.0036725997924804688, -0.0032711029052734375, -0.0028696060180664062, -0.002468109130859375, -0.0020666122436523438, -0.0016651153564453125, -0.0012636184692382812, -0.00086212158203125, -0.00046062469482421875, -5.91278076171875e-05, 0.00034236907958984375, 0.000743865966796875, 0.0011453628540039062, 0.0015468597412109375, 0.0019483566284179688, 0.002349853515625, 0.0027513504028320312, 0.0031528472900390625, 0.0035543441772460938, 0.003955841064453125, 0.004357337951660156, 0.0047588348388671875, 0.005160331726074219, 0.00556182861328125, 0.005963325500488281, 0.0063648223876953125, 0.006766319274902344, 0.007167816162109375, 0.007569313049316406, 0.007970809936523438, 0.008372306823730469, 0.0087738037109375, 0.009175300598144531, 0.009576797485351562, 0.009978294372558594, 0.010379791259765625, 0.010781288146972656, 0.011182785034179688, 0.011584281921386719, 0.01198577880859375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 11.0, 13.0, 21.0, 42.0, 78.0, 107.0, 139.0, 134.0, 152.0, 132.0, 80.0, 47.0, 23.0, 17.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000258095795288682, -0.00024033985391724855, -0.0002225839125458151, -0.0002048279857262969, -0.00018707204435486346, -0.00016931610298343003, -0.00015156017616391182, -0.00013380423479247838, -0.00011604829342104495, -9.829235204961151e-05, -8.053641795413569e-05, -6.278048385865986e-05, -4.5024542487226427e-05, -2.726860111579299e-05, -9.512667020317167e-06, 8.243267075158656e-06, 2.5999208446592093e-05, 4.375514618004672e-05, 6.151108391350135e-05, 7.926701800897717e-05, 9.702295938041061e-05, 0.00011477890075184405, 0.00013253482757136226, 0.0001502907689427957, 0.00016804671031422913, 0.00018580265168566257, 0.000203558593057096, 0.0002213145198766142, 0.00023907046124804765, 0.0002568264026194811, 0.0002745823294389993, 0.0002923382562585175, 0.0003100942703895271, 0.0003278501972090453, 0.00034560615313239396, 0.00036336207995191216, 0.00038111803587526083, 0.00039887396269477904, 0.00041662988951429725, 0.0004343858454376459, 0.0004521417722571641, 0.00046989769907668233, 0.000487653655000031, 0.0005054096109233797, 0.0005231655086390674, 0.0005409214645624161, 0.0005586774204857647, 0.0005764333182014525, 0.0005941892741248012, 0.0006119452300481498, 0.0006297011277638376, 0.0006474570836871862, 0.0006652130396105349, 0.0006829689955338836, 0.0007007248932495713, 0.00071848084917292, 0.0007362368050962687, 0.0007539927610196173, 0.0007717486587353051, 0.0007895046146586537, 0.0008072605705820024, 0.0008250165265053511, 0.0008427724242210388, 0.0008605283801443875, 0.0008782842778600752]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 6.0, 5.0, 4.0, 3.0, 10.0, 11.0, 14.0, 15.0, 20.0, 24.0, 27.0, 19.0, 28.0, 29.0, 35.0, 42.0, 44.0, 42.0, 45.0, 50.0, 42.0, 44.0, 39.0, 41.0, 43.0, 36.0, 43.0, 27.0, 38.0, 31.0, 17.0, 22.0, 18.0, 22.0, 19.0, 10.0, 9.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004277229309082031, -0.00041467975825071335, -0.00040163658559322357, -0.0003885934129357338, -0.000375550240278244, -0.00036250706762075424, -0.00034946389496326447, -0.0003364207223057747, -0.0003233775496482849, -0.00031033437699079514, -0.00029729120433330536, -0.0002842480316758156, -0.0002712048590183258, -0.00025816168636083603, -0.00024511851370334625, -0.00023207534104585648, -0.0002190321683883667, -0.00020598899573087692, -0.00019294582307338715, -0.00017990265041589737, -0.0001668594777584076, -0.00015381630510091782, -0.00014077313244342804, -0.00012772995978593826, -0.00011468678712844849, -0.00010164361447095871, -8.860044181346893e-05, -7.555726915597916e-05, -6.251409649848938e-05, -4.94709238409996e-05, -3.642775118350983e-05, -2.338457852602005e-05, -1.0341405868530273e-05, 2.701766788959503e-06, 1.574493944644928e-05, 2.8788112103939056e-05, 4.183128476142883e-05, 5.487445741891861e-05, 6.791763007640839e-05, 8.096080273389816e-05, 9.400397539138794e-05, 0.00010704714804887772, 0.00012009032070636749, 0.00013313349336385727, 0.00014617666602134705, 0.00015921983867883682, 0.0001722630113363266, 0.00018530618399381638, 0.00019834935665130615, 0.00021139252930879593, 0.0002244357019662857, 0.00023747887462377548, 0.00025052204728126526, 0.00026356521993875504, 0.0002766083925962448, 0.0002896515652537346, 0.00030269473791122437, 0.00031573791056871414, 0.0003287810832262039, 0.0003418242558836937, 0.00035486742854118347, 0.00036791060119867325, 0.000380953773856163, 0.0003939969465136528, 0.0004070401191711426]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 6.0, 7.0, 11.0, 11.0, 16.0, 10.0, 18.0, 20.0, 14.0, 26.0, 29.0, 38.0, 27.0, 33.0, 32.0, 36.0, 43.0, 40.0, 30.0, 48.0, 30.0, 51.0, 47.0, 30.0, 23.0, 35.0, 34.0, 25.0, 34.0, 20.0, 15.0, 17.0, 18.0, 10.0, 16.0, 15.0, 12.0, 6.0, 11.0, 15.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 6.0, 3.0], "bins": [-3.033203125, -2.9478759765625, -2.862548828125, -2.7772216796875, -2.69189453125, -2.6065673828125, -2.521240234375, -2.4359130859375, -2.3505859375, -2.2652587890625, -2.179931640625, -2.0946044921875, -2.00927734375, -1.9239501953125, -1.838623046875, -1.7532958984375, -1.66796875, -1.5826416015625, -1.497314453125, -1.4119873046875, -1.32666015625, -1.2413330078125, -1.156005859375, -1.0706787109375, -0.9853515625, -0.9000244140625, -0.814697265625, -0.7293701171875, -0.64404296875, -0.5587158203125, -0.473388671875, -0.3880615234375, -0.302734375, -0.2174072265625, -0.132080078125, -0.0467529296875, 0.03857421875, 0.1239013671875, 0.209228515625, 0.2945556640625, 0.3798828125, 0.4652099609375, 0.550537109375, 0.6358642578125, 0.72119140625, 0.8065185546875, 0.891845703125, 0.9771728515625, 1.0625, 1.1478271484375, 1.233154296875, 1.3184814453125, 1.40380859375, 1.4891357421875, 1.574462890625, 1.6597900390625, 1.7451171875, 1.8304443359375, 1.915771484375, 2.0010986328125, 2.08642578125, 2.1717529296875, 2.257080078125, 2.3424072265625, 2.427734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 17.0, 14.0, 27.0, 26.0, 49.0, 42.0, 64.0, 92.0, 137.0, 203.0, 255.0, 356.0, 560.0, 865.0, 1340.0, 2208.0, 3505.0, 5782.0, 9795.0, 18147.0, 37416.0, 85982.0, 202316.0, 336722.0, 187501.0, 79216.0, 34826.0, 17077.0, 9246.0, 5379.0, 3273.0, 2126.0, 1328.0, 805.0, 550.0, 387.0, 255.0, 178.0, 136.0, 77.0, 68.0, 50.0, 42.0, 39.0, 25.0, 11.0, 11.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0], "bins": [-2.75, -2.662567138671875, -2.57513427734375, -2.487701416015625, -2.4002685546875, -2.312835693359375, -2.22540283203125, -2.137969970703125, -2.050537109375, -1.963104248046875, -1.87567138671875, -1.788238525390625, -1.7008056640625, -1.613372802734375, -1.52593994140625, -1.438507080078125, -1.35107421875, -1.263641357421875, -1.17620849609375, -1.088775634765625, -1.0013427734375, -0.913909912109375, -0.82647705078125, -0.739044189453125, -0.651611328125, -0.564178466796875, -0.47674560546875, -0.389312744140625, -0.3018798828125, -0.214447021484375, -0.12701416015625, -0.039581298828125, 0.0478515625, 0.135284423828125, 0.22271728515625, 0.310150146484375, 0.3975830078125, 0.485015869140625, 0.57244873046875, 0.659881591796875, 0.747314453125, 0.834747314453125, 0.92218017578125, 1.009613037109375, 1.0970458984375, 1.184478759765625, 1.27191162109375, 1.359344482421875, 1.44677734375, 1.534210205078125, 1.62164306640625, 1.709075927734375, 1.7965087890625, 1.883941650390625, 1.97137451171875, 2.058807373046875, 2.146240234375, 2.233673095703125, 2.32110595703125, 2.408538818359375, 2.4959716796875, 2.583404541015625, 2.67083740234375, 2.758270263671875, 2.845703125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 2.0, 4.0, 8.0, 5.0, 10.0, 6.0, 11.0, 12.0, 18.0, 17.0, 22.0, 23.0, 24.0, 37.0, 36.0, 35.0, 35.0, 49.0, 47.0, 85.0, 137.0, 1427.0, 405.0, 114.0, 76.0, 46.0, 51.0, 40.0, 27.0, 30.0, 25.0, 20.0, 30.0, 26.0, 19.0, 7.0, 9.0, 14.0, 15.0, 14.0, 6.0, 5.0, 10.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.796875, -9.4805908203125, -9.164306640625, -8.8480224609375, -8.53173828125, -8.2154541015625, -7.899169921875, -7.5828857421875, -7.2666015625, -6.9503173828125, -6.634033203125, -6.3177490234375, -6.00146484375, -5.6851806640625, -5.368896484375, -5.0526123046875, -4.736328125, -4.4200439453125, -4.103759765625, -3.7874755859375, -3.47119140625, -3.1549072265625, -2.838623046875, -2.5223388671875, -2.2060546875, -1.8897705078125, -1.573486328125, -1.2572021484375, -0.94091796875, -0.6246337890625, -0.308349609375, 0.0079345703125, 0.32421875, 0.6405029296875, 0.956787109375, 1.2730712890625, 1.58935546875, 1.9056396484375, 2.221923828125, 2.5382080078125, 2.8544921875, 3.1707763671875, 3.487060546875, 3.8033447265625, 4.11962890625, 4.4359130859375, 4.752197265625, 5.0684814453125, 5.384765625, 5.7010498046875, 6.017333984375, 6.3336181640625, 6.64990234375, 6.9661865234375, 7.282470703125, 7.5987548828125, 7.9150390625, 8.2313232421875, 8.547607421875, 8.8638916015625, 9.18017578125, 9.4964599609375, 9.812744140625, 10.1290283203125, 10.4453125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 7.0, 10.0, 14.0, 24.0, 18.0, 21.0, 26.0, 63.0, 54.0, 63.0, 103.0, 149.0, 314.0, 756.0, 3734.0, 61550.0, 2975123.0, 97196.0, 4602.0, 879.0, 340.0, 210.0, 106.0, 85.0, 56.0, 40.0, 33.0, 30.0, 19.0, 15.0, 9.0, 10.0, 11.0, 4.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.109375, -21.487548828125, -20.86572265625, -20.243896484375, -19.6220703125, -19.000244140625, -18.37841796875, -17.756591796875, -17.134765625, -16.512939453125, -15.89111328125, -15.269287109375, -14.6474609375, -14.025634765625, -13.40380859375, -12.781982421875, -12.16015625, -11.538330078125, -10.91650390625, -10.294677734375, -9.6728515625, -9.051025390625, -8.42919921875, -7.807373046875, -7.185546875, -6.563720703125, -5.94189453125, -5.320068359375, -4.6982421875, -4.076416015625, -3.45458984375, -2.832763671875, -2.2109375, -1.589111328125, -0.96728515625, -0.345458984375, 0.2763671875, 0.898193359375, 1.52001953125, 2.141845703125, 2.763671875, 3.385498046875, 4.00732421875, 4.629150390625, 5.2509765625, 5.872802734375, 6.49462890625, 7.116455078125, 7.73828125, 8.360107421875, 8.98193359375, 9.603759765625, 10.2255859375, 10.847412109375, 11.46923828125, 12.091064453125, 12.712890625, 13.334716796875, 13.95654296875, 14.578369140625, 15.2001953125, 15.822021484375, 16.44384765625, 17.065673828125, 17.6875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 10.0, 66.0, 258.0, 414.0, 201.0, 52.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.334421157836914, -8.718422889709473, -7.102424621582031, -5.48642635345459, -3.8704280853271484, -2.254429817199707, -0.6384315490722656, 0.9775667190551758, 2.593564987182617, 4.209563255310059, 5.8255615234375, 7.441559791564941, 9.057558059692383, 10.673556327819824, 12.289554595947266, 13.905552864074707, 15.521551132202148, 17.137550354003906, 18.75354766845703, 20.369544982910156, 21.985544204711914, 23.601543426513672, 25.217540740966797, 26.833538055419922, 28.44953727722168, 30.065536499023438, 31.681533813476562, 33.29753112792969, 34.91352844238281, 36.5295295715332, 38.14552688598633, 39.76152420043945, 41.377525329589844, 42.99352264404297, 44.609519958496094, 46.225521087646484, 47.84151840209961, 49.457515716552734, 51.073516845703125, 52.68951416015625, 54.305511474609375, 55.9215087890625, 57.537506103515625, 59.153507232666016, 60.76950454711914, 62.385501861572266, 64.00150299072266, 65.61750030517578, 67.2334976196289, 68.84949493408203, 70.46549224853516, 72.08148956298828, 73.69749450683594, 75.31349182128906, 76.92948913574219, 78.54548645019531, 80.16148376464844, 81.77748107910156, 83.39347839355469, 85.00947570800781, 86.62547302246094, 88.2414779663086, 89.85747528076172, 91.47347259521484, 93.08946990966797]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 9.0, 10.0, 11.0, 16.0, 13.0, 16.0, 32.0, 31.0, 34.0, 35.0, 48.0, 35.0, 30.0, 39.0, 35.0, 27.0, 35.0, 36.0, 32.0, 52.0, 34.0, 32.0, 29.0, 29.0, 30.0, 42.0, 25.0, 25.0, 19.0, 18.0, 21.0, 11.0, 8.0, 11.0, 7.0, 13.0, 5.0, 9.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.35616683959961, -28.36530113220215, -27.37443733215332, -26.38357162475586, -25.39270782470703, -24.40184211730957, -23.41097640991211, -22.42011260986328, -21.429248809814453, -20.438383102416992, -19.447519302368164, -18.456653594970703, -17.465789794921875, -16.474924087524414, -15.48405933380127, -14.493194580078125, -13.502328872680664, -12.51146411895752, -11.520599365234375, -10.529733657836914, -9.538869857788086, -8.548004150390625, -7.5571393966674805, -6.566274642944336, -5.575409889221191, -4.584545135498047, -3.5936801433563232, -2.6028151512145996, -1.611950397491455, -0.6210856437683105, 0.3697795867919922, 1.3606443405151367, 2.3515090942382812, 3.342373847961426, 4.33323860168457, 5.324103832244873, 6.314968585968018, 7.305833339691162, 8.296698570251465, 9.28756332397461, 10.278428077697754, 11.269292831420898, 12.260157585144043, 13.251022338867188, 14.241888046264648, 15.232751846313477, 16.223617553710938, 17.214481353759766, 18.205347061157227, 19.196212768554688, 20.187076568603516, 21.177942276000977, 22.168806076049805, 23.159671783447266, 24.150535583496094, 25.141401290893555, 26.132266998291016, 27.123132705688477, 28.113996505737305, 29.104862213134766, 30.095726013183594, 31.086591720581055, 32.077457427978516, 33.068321228027344, 34.05918502807617]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 9.0, 12.0, 11.0, 11.0, 8.0, 15.0, 18.0, 20.0, 25.0, 29.0, 28.0, 30.0, 24.0, 39.0, 39.0, 42.0, 37.0, 44.0, 50.0, 40.0, 31.0, 48.0, 42.0, 35.0, 34.0, 30.0, 26.0, 29.0, 19.0, 20.0, 16.0, 12.0, 21.0, 19.0, 10.0, 11.0, 12.0, 8.0, 9.0, 3.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0], "bins": [-3.267578125, -3.173675537109375, -3.07977294921875, -2.985870361328125, -2.8919677734375, -2.798065185546875, -2.70416259765625, -2.610260009765625, -2.516357421875, -2.422454833984375, -2.32855224609375, -2.234649658203125, -2.1407470703125, -2.046844482421875, -1.95294189453125, -1.859039306640625, -1.76513671875, -1.671234130859375, -1.57733154296875, -1.483428955078125, -1.3895263671875, -1.295623779296875, -1.20172119140625, -1.107818603515625, -1.013916015625, -0.920013427734375, -0.82611083984375, -0.732208251953125, -0.6383056640625, -0.544403076171875, -0.45050048828125, -0.356597900390625, -0.2626953125, -0.168792724609375, -0.07489013671875, 0.019012451171875, 0.1129150390625, 0.206817626953125, 0.30072021484375, 0.394622802734375, 0.488525390625, 0.582427978515625, 0.67633056640625, 0.770233154296875, 0.8641357421875, 0.958038330078125, 1.05194091796875, 1.145843505859375, 1.23974609375, 1.333648681640625, 1.42755126953125, 1.521453857421875, 1.6153564453125, 1.709259033203125, 1.80316162109375, 1.897064208984375, 1.990966796875, 2.084869384765625, 2.17877197265625, 2.272674560546875, 2.3665771484375, 2.460479736328125, 2.55438232421875, 2.648284912109375, 2.7421875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 6.0, 7.0, 8.0, 8.0, 10.0, 8.0, 11.0, 11.0, 18.0, 23.0, 25.0, 35.0, 37.0, 55.0, 104.0, 165.0, 503.0, 1977.0, 14027.0, 195908.0, 3007820.0, 923884.0, 43475.0, 4604.0, 869.0, 246.0, 126.0, 63.0, 49.0, 33.0, 25.0, 13.0, 21.0, 14.0, 16.0, 12.0, 11.0, 10.0, 10.0, 5.0, 5.0, 7.0, 1.0, 3.0, 5.0, 2.0, 4.0, 0.0, 3.0], "bins": [-15.25, -14.8232421875, -14.396484375, -13.9697265625, -13.54296875, -13.1162109375, -12.689453125, -12.2626953125, -11.8359375, -11.4091796875, -10.982421875, -10.5556640625, -10.12890625, -9.7021484375, -9.275390625, -8.8486328125, -8.421875, -7.9951171875, -7.568359375, -7.1416015625, -6.71484375, -6.2880859375, -5.861328125, -5.4345703125, -5.0078125, -4.5810546875, -4.154296875, -3.7275390625, -3.30078125, -2.8740234375, -2.447265625, -2.0205078125, -1.59375, -1.1669921875, -0.740234375, -0.3134765625, 0.11328125, 0.5400390625, 0.966796875, 1.3935546875, 1.8203125, 2.2470703125, 2.673828125, 3.1005859375, 3.52734375, 3.9541015625, 4.380859375, 4.8076171875, 5.234375, 5.6611328125, 6.087890625, 6.5146484375, 6.94140625, 7.3681640625, 7.794921875, 8.2216796875, 8.6484375, 9.0751953125, 9.501953125, 9.9287109375, 10.35546875, 10.7822265625, 11.208984375, 11.6357421875, 12.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 10.0, 10.0, 8.0, 22.0, 35.0, 32.0, 57.0, 85.0, 120.0, 152.0, 246.0, 319.0, 436.0, 486.0, 510.0, 391.0, 349.0, 251.0, 162.0, 122.0, 81.0, 56.0, 43.0, 27.0, 28.0, 13.0, 8.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.9718017578125, -11.638916015625, -11.3060302734375, -10.97314453125, -10.6402587890625, -10.307373046875, -9.9744873046875, -9.6416015625, -9.3087158203125, -8.975830078125, -8.6429443359375, -8.31005859375, -7.9771728515625, -7.644287109375, -7.3114013671875, -6.978515625, -6.6456298828125, -6.312744140625, -5.9798583984375, -5.64697265625, -5.3140869140625, -4.981201171875, -4.6483154296875, -4.3154296875, -3.9825439453125, -3.649658203125, -3.3167724609375, -2.98388671875, -2.6510009765625, -2.318115234375, -1.9852294921875, -1.65234375, -1.3194580078125, -0.986572265625, -0.6536865234375, -0.32080078125, 0.0120849609375, 0.344970703125, 0.6778564453125, 1.0107421875, 1.3436279296875, 1.676513671875, 2.0093994140625, 2.34228515625, 2.6751708984375, 3.008056640625, 3.3409423828125, 3.673828125, 4.0067138671875, 4.339599609375, 4.6724853515625, 5.00537109375, 5.3382568359375, 5.671142578125, 6.0040283203125, 6.3369140625, 6.6697998046875, 7.002685546875, 7.3355712890625, 7.66845703125, 8.0013427734375, 8.334228515625, 8.6671142578125, 9.0]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 7.0, 11.0, 14.0, 17.0, 18.0, 36.0, 61.0, 77.0, 127.0, 206.0, 395.0, 904.0, 3292.0, 27319.0, 506738.0, 3282627.0, 347868.0, 20192.0, 2721.0, 795.0, 361.0, 168.0, 118.0, 78.0, 33.0, 32.0, 17.0, 12.0, 11.0, 8.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.453125, -16.739013671875, -16.02490234375, -15.310791015625, -14.5966796875, -13.882568359375, -13.16845703125, -12.454345703125, -11.740234375, -11.026123046875, -10.31201171875, -9.597900390625, -8.8837890625, -8.169677734375, -7.45556640625, -6.741455078125, -6.02734375, -5.313232421875, -4.59912109375, -3.885009765625, -3.1708984375, -2.456787109375, -1.74267578125, -1.028564453125, -0.314453125, 0.399658203125, 1.11376953125, 1.827880859375, 2.5419921875, 3.256103515625, 3.97021484375, 4.684326171875, 5.3984375, 6.112548828125, 6.82666015625, 7.540771484375, 8.2548828125, 8.968994140625, 9.68310546875, 10.397216796875, 11.111328125, 11.825439453125, 12.53955078125, 13.253662109375, 13.9677734375, 14.681884765625, 15.39599609375, 16.110107421875, 16.82421875, 17.538330078125, 18.25244140625, 18.966552734375, 19.6806640625, 20.394775390625, 21.10888671875, 21.822998046875, 22.537109375, 23.251220703125, 23.96533203125, 24.679443359375, 25.3935546875, 26.107666015625, 26.82177734375, 27.535888671875, 28.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 10.0, 53.0, 154.0, 264.0, 284.0, 172.0, 56.0, 18.0, 2.0, 2.0], "bins": [-215.17364501953125, -211.4653778076172, -207.75711059570312, -204.04884338378906, -200.340576171875, -196.63230895996094, -192.92404174804688, -189.21578979492188, -185.50750732421875, -181.7992401123047, -178.09097290039062, -174.38270568847656, -170.6744384765625, -166.96617126464844, -163.25790405273438, -159.54965209960938, -155.8413848876953, -152.13311767578125, -148.4248504638672, -144.71658325195312, -141.00831604003906, -137.300048828125, -133.59178161621094, -129.88351440429688, -126.17525482177734, -122.46698760986328, -118.75872039794922, -115.05045318603516, -111.34219360351562, -107.63392639160156, -103.9256591796875, -100.21739196777344, -96.50912475585938, -92.80085754394531, -89.09259033203125, -85.38432312011719, -81.67605590820312, -77.96778869628906, -74.25952911376953, -70.55126190185547, -66.8429946899414, -63.134727478027344, -59.42646026611328, -55.718196868896484, -52.00992965698242, -48.30166244506836, -44.59339904785156, -40.8851318359375, -37.17686462402344, -33.468597412109375, -29.760332107543945, -26.052066802978516, -22.343799591064453, -18.63553237915039, -14.927267074584961, -11.219001770019531, -7.510736465454102, -3.8024702072143555, -0.09420394897460938, 3.6140623092651367, 7.322328567504883, 11.030595779418945, 14.738861083984375, 18.447126388549805, 22.155393600463867]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 15.0, 12.0, 11.0, 11.0, 13.0, 20.0, 25.0, 31.0, 29.0, 29.0, 30.0, 31.0, 44.0, 44.0, 50.0, 52.0, 33.0, 50.0, 33.0, 38.0, 49.0, 40.0, 35.0, 50.0, 30.0, 19.0, 31.0, 21.0, 16.0, 27.0, 21.0, 8.0, 10.0, 14.0, 5.0, 6.0, 1.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-35.61521530151367, -34.57433319091797, -33.533451080322266, -32.49257278442383, -31.451690673828125, -30.410808563232422, -29.36992645263672, -28.329044342041016, -27.288164138793945, -26.247282028198242, -25.206401824951172, -24.16551971435547, -23.124637603759766, -22.083757400512695, -21.042875289916992, -20.001995086669922, -18.96111297607422, -17.920230865478516, -16.879350662231445, -15.838468551635742, -14.797587394714355, -13.756706237792969, -12.715824127197266, -11.674942970275879, -10.634061813354492, -9.593180656433105, -8.552299499511719, -7.511417388916016, -6.470536231994629, -5.429655075073242, -4.388773441314697, -3.3478918075561523, -2.3070106506347656, -1.2661292552947998, -0.22524785995483398, 0.8156335353851318, 1.8565149307250977, 2.8973960876464844, 3.9382777214050293, 4.979159355163574, 6.020040512084961, 7.060921669006348, 8.101802825927734, 9.142684936523438, 10.183566093444824, 11.224447250366211, 12.265329360961914, 13.3062105178833, 14.347091674804688, 15.387972831726074, 16.42885398864746, 17.469736099243164, 18.510616302490234, 19.551498413085938, 20.59238052368164, 21.633262634277344, 22.674142837524414, 23.715024948120117, 24.755905151367188, 25.79678726196289, 26.837669372558594, 27.878549575805664, 28.919431686401367, 29.960311889648438, 31.00119400024414]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 12.0, 13.0, 11.0, 20.0, 20.0, 19.0, 15.0, 30.0, 32.0, 39.0, 34.0, 37.0, 47.0, 46.0, 49.0, 52.0, 56.0, 50.0, 35.0, 35.0, 35.0, 30.0, 36.0, 37.0, 23.0, 21.0, 30.0, 27.0, 11.0, 12.0, 16.0, 5.0, 8.0, 6.0, 9.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.39263916015625, -3.2833251953125, -3.17401123046875, -3.064697265625, -2.95538330078125, -2.8460693359375, -2.73675537109375, -2.62744140625, -2.51812744140625, -2.4088134765625, -2.29949951171875, -2.190185546875, -2.08087158203125, -1.9715576171875, -1.86224365234375, -1.7529296875, -1.64361572265625, -1.5343017578125, -1.42498779296875, -1.315673828125, -1.20635986328125, -1.0970458984375, -0.98773193359375, -0.87841796875, -0.76910400390625, -0.6597900390625, -0.55047607421875, -0.441162109375, -0.33184814453125, -0.2225341796875, -0.11322021484375, -0.00390625, 0.10540771484375, 0.2147216796875, 0.32403564453125, 0.433349609375, 0.54266357421875, 0.6519775390625, 0.76129150390625, 0.87060546875, 0.97991943359375, 1.0892333984375, 1.19854736328125, 1.307861328125, 1.41717529296875, 1.5264892578125, 1.63580322265625, 1.7451171875, 1.85443115234375, 1.9637451171875, 2.07305908203125, 2.182373046875, 2.29168701171875, 2.4010009765625, 2.51031494140625, 2.61962890625, 2.72894287109375, 2.8382568359375, 2.94757080078125, 3.056884765625, 3.16619873046875, 3.2755126953125, 3.38482666015625, 3.494140625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 4.0, 9.0, 8.0, 41.0, 31.0, 46.0, 90.0, 121.0, 193.0, 279.0, 461.0, 813.0, 1230.0, 2053.0, 3447.0, 5543.0, 9546.0, 16394.0, 28446.0, 49717.0, 88671.0, 159010.0, 247651.0, 188434.0, 105725.0, 59559.0, 33763.0, 19333.0, 11296.0, 6481.0, 3911.0, 2304.0, 1420.0, 962.0, 549.0, 363.0, 253.0, 142.0, 93.0, 56.0, 48.0, 27.0, 18.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27783203125, -0.26813507080078125, -0.2584381103515625, -0.24874114990234375, -0.239044189453125, -0.22934722900390625, -0.2196502685546875, -0.20995330810546875, -0.20025634765625, -0.19055938720703125, -0.1808624267578125, -0.17116546630859375, -0.161468505859375, -0.15177154541015625, -0.1420745849609375, -0.13237762451171875, -0.1226806640625, -0.11298370361328125, -0.1032867431640625, -0.09358978271484375, -0.083892822265625, -0.07419586181640625, -0.0644989013671875, -0.05480194091796875, -0.04510498046875, -0.03540802001953125, -0.0257110595703125, -0.01601409912109375, -0.006317138671875, 0.00337982177734375, 0.0130767822265625, 0.02277374267578125, 0.032470703125, 0.04216766357421875, 0.0518646240234375, 0.06156158447265625, 0.071258544921875, 0.08095550537109375, 0.0906524658203125, 0.10034942626953125, 0.11004638671875, 0.11974334716796875, 0.1294403076171875, 0.13913726806640625, 0.148834228515625, 0.15853118896484375, 0.1682281494140625, 0.17792510986328125, 0.1876220703125, 0.19731903076171875, 0.2070159912109375, 0.21671295166015625, 0.226409912109375, 0.23610687255859375, 0.2458038330078125, 0.25550079345703125, 0.26519775390625, 0.27489471435546875, 0.2845916748046875, 0.29428863525390625, 0.303985595703125, 0.31368255615234375, 0.3233795166015625, 0.33307647705078125, 0.3427734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 15.0, 8.0, 10.0, 14.0, 17.0, 26.0, 20.0, 33.0, 31.0, 26.0, 28.0, 31.0, 41.0, 49.0, 40.0, 48.0, 51.0, 1058.0, 56.0, 42.0, 40.0, 40.0, 35.0, 38.0, 33.0, 26.0, 23.0, 33.0, 20.0, 17.0, 15.0, 8.0, 12.0, 4.0, 10.0, 4.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.490234375, -2.419677734375, -2.34912109375, -2.278564453125, -2.2080078125, -2.137451171875, -2.06689453125, -1.996337890625, -1.92578125, -1.855224609375, -1.78466796875, -1.714111328125, -1.6435546875, -1.572998046875, -1.50244140625, -1.431884765625, -1.361328125, -1.290771484375, -1.22021484375, -1.149658203125, -1.0791015625, -1.008544921875, -0.93798828125, -0.867431640625, -0.796875, -0.726318359375, -0.65576171875, -0.585205078125, -0.5146484375, -0.444091796875, -0.37353515625, -0.302978515625, -0.232421875, -0.161865234375, -0.09130859375, -0.020751953125, 0.0498046875, 0.120361328125, 0.19091796875, 0.261474609375, 0.33203125, 0.402587890625, 0.47314453125, 0.543701171875, 0.6142578125, 0.684814453125, 0.75537109375, 0.825927734375, 0.896484375, 0.967041015625, 1.03759765625, 1.108154296875, 1.1787109375, 1.249267578125, 1.31982421875, 1.390380859375, 1.4609375, 1.531494140625, 1.60205078125, 1.672607421875, 1.7431640625, 1.813720703125, 1.88427734375, 1.954833984375, 2.025390625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 9.0, 17.0, 27.0, 31.0, 56.0, 78.0, 123.0, 193.0, 304.0, 452.0, 637.0, 982.0, 1443.0, 2249.0, 3413.0, 5239.0, 7943.0, 12191.0, 18992.0, 28634.0, 43944.0, 66515.0, 99723.0, 144830.0, 1220891.0, 144137.0, 100548.0, 66095.0, 43783.0, 29028.0, 18894.0, 12316.0, 8045.0, 5324.0, 3377.0, 2229.0, 1581.0, 961.0, 633.0, 423.0, 266.0, 186.0, 128.0, 92.0, 62.0, 33.0, 27.0, 13.0, 13.0, 11.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.202392578125, -0.1961650848388672, -0.18993759155273438, -0.18371009826660156, -0.17748260498046875, -0.17125511169433594, -0.16502761840820312, -0.1588001251220703, -0.1525726318359375, -0.1463451385498047, -0.14011764526367188, -0.13389015197753906, -0.12766265869140625, -0.12143516540527344, -0.11520767211914062, -0.10898017883300781, -0.102752685546875, -0.09652519226074219, -0.09029769897460938, -0.08407020568847656, -0.07784271240234375, -0.07161521911621094, -0.06538772583007812, -0.05916023254394531, -0.0529327392578125, -0.04670524597167969, -0.040477752685546875, -0.03425025939941406, -0.02802276611328125, -0.021795272827148438, -0.015567779541015625, -0.009340286254882812, -0.00311279296875, 0.0031147003173828125, 0.009342193603515625, 0.015569686889648438, 0.02179718017578125, 0.028024673461914062, 0.034252166748046875, 0.04047966003417969, 0.0467071533203125, 0.05293464660644531, 0.059162139892578125, 0.06538963317871094, 0.07161712646484375, 0.07784461975097656, 0.08407211303710938, 0.09029960632324219, 0.096527099609375, 0.10275459289550781, 0.10898208618164062, 0.11520957946777344, 0.12143707275390625, 0.12766456604003906, 0.13389205932617188, 0.1401195526123047, 0.1463470458984375, 0.1525745391845703, 0.15880203247070312, 0.16502952575683594, 0.17125701904296875, 0.17748451232910156, 0.18371200561523438, 0.1899394989013672, 0.1961669921875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 12.0, 6.0, 11.0, 16.0, 21.0, 18.0, 35.0, 40.0, 42.0, 57.0, 65.0, 60.0, 71.0, 93.0, 66.0, 75.0, 67.0, 50.0, 30.0, 26.0, 24.0, 15.0, 16.0, 22.0, 11.0, 11.0, 4.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009241104125976562, -0.0008934289216995239, -0.0008627474308013916, -0.0008320659399032593, -0.000801384449005127, -0.0007707029581069946, -0.0007400214672088623, -0.00070933997631073, -0.0006786584854125977, -0.0006479769945144653, -0.000617295503616333, -0.0005866140127182007, -0.0005559325218200684, -0.000525251030921936, -0.0004945695400238037, -0.0004638880491256714, -0.00043320655822753906, -0.00040252506732940674, -0.0003718435764312744, -0.0003411620855331421, -0.00031048059463500977, -0.00027979910373687744, -0.0002491176128387451, -0.0002184361219406128, -0.00018775463104248047, -0.00015707314014434814, -0.00012639164924621582, -9.57101583480835e-05, -6.502866744995117e-05, -3.434717655181885e-05, -3.6656856536865234e-06, 2.70158052444458e-05, 5.7697296142578125e-05, 8.837878704071045e-05, 0.00011906027793884277, 0.0001497417688369751, 0.00018042325973510742, 0.00021110475063323975, 0.00024178624153137207, 0.0002724677324295044, 0.0003031492233276367, 0.00033383071422576904, 0.00036451220512390137, 0.0003951936960220337, 0.000425875186920166, 0.00045655667781829834, 0.00048723816871643066, 0.000517919659614563, 0.0005486011505126953, 0.0005792826414108276, 0.00060996413230896, 0.0006406456232070923, 0.0006713271141052246, 0.0007020086050033569, 0.0007326900959014893, 0.0007633715867996216, 0.0007940530776977539, 0.0008247345685958862, 0.0008554160594940186, 0.0008860975503921509, 0.0009167790412902832, 0.0009474605321884155, 0.0009781420230865479, 0.0010088235139846802, 0.0010395050048828125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 6.0, 8.0, 6.0, 11.0, 9.0, 19.0, 16.0, 30.0, 34.0, 40.0, 64.0, 72.0, 99.0, 179.0, 257.0, 432.0, 1152.0, 251001.0, 791714.0, 2006.0, 479.0, 273.0, 187.0, 118.0, 76.0, 68.0, 65.0, 40.0, 18.0, 16.0, 14.0, 5.0, 7.0, 9.0, 10.0, 2.0, 1.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0186767578125, -0.018144726753234863, -0.017612695693969727, -0.01708066463470459, -0.016548633575439453, -0.016016602516174316, -0.01548457145690918, -0.014952540397644043, -0.014420509338378906, -0.01388847827911377, -0.013356447219848633, -0.012824416160583496, -0.01229238510131836, -0.011760354042053223, -0.011228322982788086, -0.01069629192352295, -0.010164260864257812, -0.009632229804992676, -0.009100198745727539, -0.008568167686462402, -0.008036136627197266, -0.007504105567932129, -0.006972074508666992, -0.0064400434494018555, -0.005908012390136719, -0.005375981330871582, -0.004843950271606445, -0.004311919212341309, -0.003779888153076172, -0.003247857093811035, -0.0027158260345458984, -0.0021837949752807617, -0.001651763916015625, -0.0011197328567504883, -0.0005877017974853516, -5.5670738220214844e-05, 0.0004763603210449219, 0.0010083913803100586, 0.0015404224395751953, 0.002072453498840332, 0.0026044845581054688, 0.0031365156173706055, 0.003668546676635742, 0.004200577735900879, 0.004732608795166016, 0.005264639854431152, 0.005796670913696289, 0.006328701972961426, 0.0068607330322265625, 0.007392764091491699, 0.007924795150756836, 0.008456826210021973, 0.00898885726928711, 0.009520888328552246, 0.010052919387817383, 0.01058495044708252, 0.011116981506347656, 0.011649012565612793, 0.01218104362487793, 0.012713074684143066, 0.013245105743408203, 0.01377713680267334, 0.014309167861938477, 0.014841198921203613, 0.01537322998046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 29.0, 263.0, 560.0, 153.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009381965501233935, -0.0008477285737171769, -0.0007572606555186212, -0.0006667927373200655, -0.0005763247609138489, -0.0004858568136114627, -0.00039538886630907655, -0.00030492094811052084, -0.00021445297170430422, -0.00012398502440191805, -3.351707709953189e-05, 5.6950870202854276e-05, 0.00014741881750524044, 0.0002378867648076266, 0.00032835471211001277, 0.0004188226303085685, 0.0005092906067147851, 0.0005997585831210017, 0.0006902265013195574, 0.0007806944195181131, 0.0008711623959243298, 0.0009616303723305464, 0.001052098348736763, 0.0011425662087276578, 0.0012330341851338744, 0.001323502161540091, 0.0014139700215309858, 0.0015044379979372025, 0.001594905974343419, 0.0016853739507496357, 0.0017758419271558523, 0.0018663097871467471, 0.001956777647137642, 0.0020472456235438585, 0.002137713599950075, 0.0022281815763562918, 0.0023186495527625084, 0.0024091172963380814, 0.002499585272744298, 0.0025900532491505146, 0.0026805212255567312, 0.002770989201962948, 0.0028614571783691645, 0.002951925154775381, 0.003042392898350954, 0.0031328608747571707, 0.0032233288511633873, 0.003313796827569604, 0.0034042648039758205, 0.003494732780382037, 0.003585200756788254, 0.0036756687331944704, 0.003766136709600687, 0.00385660445317626, 0.00394707266241312, 0.004037540405988693, 0.004128008149564266, 0.004218475893139839, 0.0043089441023766994, 0.004399411845952272, 0.004489880055189133, 0.004580347798764706, 0.004670816008001566, 0.004761283751577139, 0.004851751960813999]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 5.0, 5.0, 10.0, 12.0, 10.0, 17.0, 20.0, 19.0, 22.0, 22.0, 26.0, 25.0, 23.0, 33.0, 36.0, 36.0, 43.0, 34.0, 30.0, 25.0, 35.0, 57.0, 32.0, 47.0, 42.0, 39.0, 35.0, 36.0, 36.0, 21.0, 27.0, 21.0, 16.0, 18.0, 12.0, 12.0, 12.0, 12.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0004127621650695801, -0.00039967894554138184, -0.0003865957260131836, -0.00037351250648498535, -0.0003604292869567871, -0.00034734606742858887, -0.0003342628479003906, -0.0003211796283721924, -0.00030809640884399414, -0.0002950131893157959, -0.00028192996978759766, -0.0002688467502593994, -0.00025576353073120117, -0.00024268031120300293, -0.0002295970916748047, -0.00021651387214660645, -0.0002034306526184082, -0.00019034743309020996, -0.00017726421356201172, -0.00016418099403381348, -0.00015109777450561523, -0.000138014554977417, -0.00012493133544921875, -0.00011184811592102051, -9.876489639282227e-05, -8.568167686462402e-05, -7.259845733642578e-05, -5.951523780822754e-05, -4.64320182800293e-05, -3.3348798751831055e-05, -2.0265579223632812e-05, -7.18235969543457e-06, 5.900859832763672e-06, 1.8984079360961914e-05, 3.2067298889160156e-05, 4.51505184173584e-05, 5.823373794555664e-05, 7.131695747375488e-05, 8.440017700195312e-05, 9.748339653015137e-05, 0.00011056661605834961, 0.00012364983558654785, 0.0001367330551147461, 0.00014981627464294434, 0.00016289949417114258, 0.00017598271369934082, 0.00018906593322753906, 0.0002021491527557373, 0.00021523237228393555, 0.0002283155918121338, 0.00024139881134033203, 0.0002544820308685303, 0.0002675652503967285, 0.00028064846992492676, 0.000293731689453125, 0.00030681490898132324, 0.0003198981285095215, 0.0003329813480377197, 0.00034606456756591797, 0.0003591477870941162, 0.00037223100662231445, 0.0003853142261505127, 0.00039839744567871094, 0.0004114806652069092, 0.0004245638847351074]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 12.0, 13.0, 11.0, 20.0, 20.0, 19.0, 15.0, 30.0, 32.0, 39.0, 34.0, 37.0, 47.0, 46.0, 49.0, 52.0, 56.0, 50.0, 35.0, 35.0, 35.0, 30.0, 36.0, 37.0, 23.0, 21.0, 30.0, 27.0, 11.0, 12.0, 16.0, 5.0, 8.0, 6.0, 9.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.39263916015625, -3.2833251953125, -3.17401123046875, -3.064697265625, -2.95538330078125, -2.8460693359375, -2.73675537109375, -2.62744140625, -2.51812744140625, -2.4088134765625, -2.29949951171875, -2.190185546875, -2.08087158203125, -1.9715576171875, -1.86224365234375, -1.7529296875, -1.64361572265625, -1.5343017578125, -1.42498779296875, -1.315673828125, -1.20635986328125, -1.0970458984375, -0.98773193359375, -0.87841796875, -0.76910400390625, -0.6597900390625, -0.55047607421875, -0.441162109375, -0.33184814453125, -0.2225341796875, -0.11322021484375, -0.00390625, 0.10540771484375, 0.2147216796875, 0.32403564453125, 0.433349609375, 0.54266357421875, 0.6519775390625, 0.76129150390625, 0.87060546875, 0.97991943359375, 1.0892333984375, 1.19854736328125, 1.307861328125, 1.41717529296875, 1.5264892578125, 1.63580322265625, 1.7451171875, 1.85443115234375, 1.9637451171875, 2.07305908203125, 2.182373046875, 2.29168701171875, 2.4010009765625, 2.51031494140625, 2.61962890625, 2.72894287109375, 2.8382568359375, 2.94757080078125, 3.056884765625, 3.16619873046875, 3.2755126953125, 3.38482666015625, 3.494140625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 10.0, 7.0, 7.0, 12.0, 14.0, 21.0, 32.0, 42.0, 68.0, 94.0, 116.0, 164.0, 237.0, 391.0, 601.0, 1097.0, 2213.0, 5040.0, 12610.0, 38251.0, 157383.0, 498071.0, 245884.0, 56383.0, 17243.0, 6437.0, 2741.0, 1295.0, 725.0, 436.0, 276.0, 165.0, 123.0, 100.0, 75.0, 56.0, 33.0, 22.0, 23.0, 12.0, 12.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.93359375, -4.79119873046875, -4.6488037109375, -4.50640869140625, -4.364013671875, -4.22161865234375, -4.0792236328125, -3.93682861328125, -3.79443359375, -3.65203857421875, -3.5096435546875, -3.36724853515625, -3.224853515625, -3.08245849609375, -2.9400634765625, -2.79766845703125, -2.6552734375, -2.51287841796875, -2.3704833984375, -2.22808837890625, -2.085693359375, -1.94329833984375, -1.8009033203125, -1.65850830078125, -1.51611328125, -1.37371826171875, -1.2313232421875, -1.08892822265625, -0.946533203125, -0.80413818359375, -0.6617431640625, -0.51934814453125, -0.376953125, -0.23455810546875, -0.0921630859375, 0.05023193359375, 0.192626953125, 0.33502197265625, 0.4774169921875, 0.61981201171875, 0.76220703125, 0.90460205078125, 1.0469970703125, 1.18939208984375, 1.331787109375, 1.47418212890625, 1.6165771484375, 1.75897216796875, 1.9013671875, 2.04376220703125, 2.1861572265625, 2.32855224609375, 2.470947265625, 2.61334228515625, 2.7557373046875, 2.89813232421875, 3.04052734375, 3.18292236328125, 3.3253173828125, 3.46771240234375, 3.610107421875, 3.75250244140625, 3.8948974609375, 4.03729248046875, 4.1796875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 2.0, 14.0, 6.0, 8.0, 17.0, 18.0, 21.0, 17.0, 35.0, 29.0, 45.0, 48.0, 51.0, 60.0, 104.0, 298.0, 1667.0, 157.0, 68.0, 57.0, 56.0, 38.0, 46.0, 32.0, 23.0, 24.0, 27.0, 20.0, 12.0, 19.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.4141845703125, -13.953369140625, -13.4925537109375, -13.03173828125, -12.5709228515625, -12.110107421875, -11.6492919921875, -11.1884765625, -10.7276611328125, -10.266845703125, -9.8060302734375, -9.34521484375, -8.8843994140625, -8.423583984375, -7.9627685546875, -7.501953125, -7.0411376953125, -6.580322265625, -6.1195068359375, -5.65869140625, -5.1978759765625, -4.737060546875, -4.2762451171875, -3.8154296875, -3.3546142578125, -2.893798828125, -2.4329833984375, -1.97216796875, -1.5113525390625, -1.050537109375, -0.5897216796875, -0.12890625, 0.3319091796875, 0.792724609375, 1.2535400390625, 1.71435546875, 2.1751708984375, 2.635986328125, 3.0968017578125, 3.5576171875, 4.0184326171875, 4.479248046875, 4.9400634765625, 5.40087890625, 5.8616943359375, 6.322509765625, 6.7833251953125, 7.244140625, 7.7049560546875, 8.165771484375, 8.6265869140625, 9.08740234375, 9.5482177734375, 10.009033203125, 10.4698486328125, 10.9306640625, 11.3914794921875, 11.852294921875, 12.3131103515625, 12.77392578125, 13.2347412109375, 13.695556640625, 14.1563720703125, 14.6171875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 8.0, 8.0, 14.0, 21.0, 11.0, 37.0, 31.0, 36.0, 41.0, 60.0, 101.0, 175.0, 333.0, 860.0, 4420.0, 134230.0, 2976153.0, 25836.0, 2106.0, 534.0, 234.0, 126.0, 81.0, 54.0, 34.0, 29.0, 26.0, 19.0, 21.0, 14.0, 12.0, 9.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.30712890625, -19.6142578125, -18.92138671875, -18.228515625, -17.53564453125, -16.8427734375, -16.14990234375, -15.45703125, -14.76416015625, -14.0712890625, -13.37841796875, -12.685546875, -11.99267578125, -11.2998046875, -10.60693359375, -9.9140625, -9.22119140625, -8.5283203125, -7.83544921875, -7.142578125, -6.44970703125, -5.7568359375, -5.06396484375, -4.37109375, -3.67822265625, -2.9853515625, -2.29248046875, -1.599609375, -0.90673828125, -0.2138671875, 0.47900390625, 1.171875, 1.86474609375, 2.5576171875, 3.25048828125, 3.943359375, 4.63623046875, 5.3291015625, 6.02197265625, 6.71484375, 7.40771484375, 8.1005859375, 8.79345703125, 9.486328125, 10.17919921875, 10.8720703125, 11.56494140625, 12.2578125, 12.95068359375, 13.6435546875, 14.33642578125, 15.029296875, 15.72216796875, 16.4150390625, 17.10791015625, 17.80078125, 18.49365234375, 19.1865234375, 19.87939453125, 20.572265625, 21.26513671875, 21.9580078125, 22.65087890625, 23.34375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 24.0, 128.0, 354.0, 360.0, 130.0, 16.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.339313507080078, -6.671306610107422, -5.003299713134766, -3.3352928161621094, -1.6672859191894531, 0.000720977783203125, 1.6687278747558594, 3.3367347717285156, 5.004741668701172, 6.672748565673828, 8.340755462646484, 10.00876235961914, 11.676769256591797, 13.344776153564453, 15.01278305053711, 16.680789947509766, 18.348796844482422, 20.016803741455078, 21.684810638427734, 23.35281753540039, 25.020824432373047, 26.688831329345703, 28.35683822631836, 30.024845123291016, 31.692852020263672, 33.36085891723633, 35.028865814208984, 36.69687271118164, 38.3648796081543, 40.03288650512695, 41.70089340209961, 43.368900299072266, 45.03691101074219, 46.704917907714844, 48.3729248046875, 50.040931701660156, 51.70893859863281, 53.37694549560547, 55.044952392578125, 56.71295928955078, 58.38096618652344, 60.048973083496094, 61.71697998046875, 63.384986877441406, 65.05299377441406, 66.72100067138672, 68.38900756835938, 70.05701446533203, 71.72502136230469, 73.39302825927734, 75.06103515625, 76.72904205322266, 78.39704895019531, 80.06505584716797, 81.73306274414062, 83.40106964111328, 85.06907653808594, 86.7370834350586, 88.40509033203125, 90.0730972290039, 91.74110412597656, 93.40911102294922, 95.07711791992188, 96.74512481689453, 98.41313171386719]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 15.0, 11.0, 12.0, 14.0, 17.0, 15.0, 14.0, 24.0, 22.0, 23.0, 29.0, 35.0, 49.0, 49.0, 31.0, 34.0, 37.0, 40.0, 35.0, 41.0, 48.0, 38.0, 35.0, 36.0, 30.0, 32.0, 34.0, 20.0, 25.0, 21.0, 17.0, 17.0, 12.0, 11.0, 12.0, 12.0, 13.0, 12.0, 5.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.41712951660156, -36.2373046875, -35.05747604370117, -33.87765121459961, -32.69782257080078, -31.51799774169922, -30.338172912597656, -29.15834617614746, -27.978519439697266, -26.79869270324707, -25.618865966796875, -24.439041137695312, -23.259214401245117, -22.079387664794922, -20.89956283569336, -19.719736099243164, -18.53990936279297, -17.360082626342773, -16.180255889892578, -15.000431060791016, -13.82060432434082, -12.640777587890625, -11.460951805114746, -10.281126022338867, -9.101299285888672, -7.921473026275635, -6.741646766662598, -5.5618205070495605, -4.381994247436523, -3.2021679878234863, -2.022341728210449, -0.8425159454345703, 0.3373069763183594, 1.5171332359313965, 2.6969594955444336, 3.8767857551574707, 5.056612014770508, 6.236438274383545, 7.416264533996582, 8.596090316772461, 9.775917053222656, 10.955743789672852, 12.13556957244873, 13.31539535522461, 14.495222091674805, 15.675048828125, 16.854873657226562, 18.034700393676758, 19.214527130126953, 20.39435386657715, 21.574180603027344, 22.754005432128906, 23.9338321685791, 25.113658905029297, 26.29348373413086, 27.473310470581055, 28.65313720703125, 29.832963943481445, 31.01279067993164, 32.1926155090332, 33.37244415283203, 34.552268981933594, 35.732093811035156, 36.91191864013672, 38.09174728393555]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 8.0, 5.0, 6.0, 12.0, 8.0, 20.0, 13.0, 18.0, 25.0, 19.0, 25.0, 33.0, 35.0, 30.0, 44.0, 42.0, 41.0, 55.0, 46.0, 54.0, 48.0, 51.0, 28.0, 35.0, 34.0, 30.0, 31.0, 36.0, 21.0, 22.0, 23.0, 15.0, 15.0, 11.0, 13.0, 4.0, 12.0, 9.0, 2.0, 2.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.591796875, -3.4798583984375, -3.367919921875, -3.2559814453125, -3.14404296875, -3.0321044921875, -2.920166015625, -2.8082275390625, -2.6962890625, -2.5843505859375, -2.472412109375, -2.3604736328125, -2.24853515625, -2.1365966796875, -2.024658203125, -1.9127197265625, -1.80078125, -1.6888427734375, -1.576904296875, -1.4649658203125, -1.35302734375, -1.2410888671875, -1.129150390625, -1.0172119140625, -0.9052734375, -0.7933349609375, -0.681396484375, -0.5694580078125, -0.45751953125, -0.3455810546875, -0.233642578125, -0.1217041015625, -0.009765625, 0.1021728515625, 0.214111328125, 0.3260498046875, 0.43798828125, 0.5499267578125, 0.661865234375, 0.7738037109375, 0.8857421875, 0.9976806640625, 1.109619140625, 1.2215576171875, 1.33349609375, 1.4454345703125, 1.557373046875, 1.6693115234375, 1.78125, 1.8931884765625, 2.005126953125, 2.1170654296875, 2.22900390625, 2.3409423828125, 2.452880859375, 2.5648193359375, 2.6767578125, 2.7886962890625, 2.900634765625, 3.0125732421875, 3.12451171875, 3.2364501953125, 3.348388671875, 3.4603271484375, 3.572265625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 4.0, 10.0, 11.0, 10.0, 14.0, 19.0, 13.0, 35.0, 51.0, 45.0, 77.0, 131.0, 275.0, 614.0, 1533.0, 4248.0, 13649.0, 49486.0, 235269.0, 1249609.0, 1989961.0, 517880.0, 96544.0, 23778.0, 6924.0, 2316.0, 857.0, 387.0, 173.0, 94.0, 61.0, 44.0, 29.0, 23.0, 23.0, 17.0, 13.0, 7.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-7.41015625, -7.1871337890625, -6.964111328125, -6.7410888671875, -6.51806640625, -6.2950439453125, -6.072021484375, -5.8489990234375, -5.6259765625, -5.4029541015625, -5.179931640625, -4.9569091796875, -4.73388671875, -4.5108642578125, -4.287841796875, -4.0648193359375, -3.841796875, -3.6187744140625, -3.395751953125, -3.1727294921875, -2.94970703125, -2.7266845703125, -2.503662109375, -2.2806396484375, -2.0576171875, -1.8345947265625, -1.611572265625, -1.3885498046875, -1.16552734375, -0.9425048828125, -0.719482421875, -0.4964599609375, -0.2734375, -0.0504150390625, 0.172607421875, 0.3956298828125, 0.61865234375, 0.8416748046875, 1.064697265625, 1.2877197265625, 1.5107421875, 1.7337646484375, 1.956787109375, 2.1798095703125, 2.40283203125, 2.6258544921875, 2.848876953125, 3.0718994140625, 3.294921875, 3.5179443359375, 3.740966796875, 3.9639892578125, 4.18701171875, 4.4100341796875, 4.633056640625, 4.8560791015625, 5.0791015625, 5.3021240234375, 5.525146484375, 5.7481689453125, 5.97119140625, 6.1942138671875, 6.417236328125, 6.6402587890625, 6.86328125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 8.0, 14.0, 19.0, 34.0, 57.0, 99.0, 153.0, 263.0, 411.0, 573.0, 696.0, 594.0, 421.0, 277.0, 176.0, 107.0, 71.0, 36.0, 29.0, 16.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0078125, -13.5494384765625, -13.091064453125, -12.6326904296875, -12.17431640625, -11.7159423828125, -11.257568359375, -10.7991943359375, -10.3408203125, -9.8824462890625, -9.424072265625, -8.9656982421875, -8.50732421875, -8.0489501953125, -7.590576171875, -7.1322021484375, -6.673828125, -6.2154541015625, -5.757080078125, -5.2987060546875, -4.84033203125, -4.3819580078125, -3.923583984375, -3.4652099609375, -3.0068359375, -2.5484619140625, -2.090087890625, -1.6317138671875, -1.17333984375, -0.7149658203125, -0.256591796875, 0.2017822265625, 0.66015625, 1.1185302734375, 1.576904296875, 2.0352783203125, 2.49365234375, 2.9520263671875, 3.410400390625, 3.8687744140625, 4.3271484375, 4.7855224609375, 5.243896484375, 5.7022705078125, 6.16064453125, 6.6190185546875, 7.077392578125, 7.5357666015625, 7.994140625, 8.4525146484375, 8.910888671875, 9.3692626953125, 9.82763671875, 10.2860107421875, 10.744384765625, 11.2027587890625, 11.6611328125, 12.1195068359375, 12.577880859375, 13.0362548828125, 13.49462890625, 13.9530029296875, 14.411376953125, 14.8697509765625, 15.328125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 6.0, 19.0, 28.0, 37.0, 80.0, 131.0, 314.0, 624.0, 2199.0, 17017.0, 427828.0, 3471873.0, 259122.0, 12025.0, 1840.0, 561.0, 271.0, 138.0, 73.0, 39.0, 30.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.51904296875, -31.6943359375, -30.86962890625, -30.044921875, -29.22021484375, -28.3955078125, -27.57080078125, -26.74609375, -25.92138671875, -25.0966796875, -24.27197265625, -23.447265625, -22.62255859375, -21.7978515625, -20.97314453125, -20.1484375, -19.32373046875, -18.4990234375, -17.67431640625, -16.849609375, -16.02490234375, -15.2001953125, -14.37548828125, -13.55078125, -12.72607421875, -11.9013671875, -11.07666015625, -10.251953125, -9.42724609375, -8.6025390625, -7.77783203125, -6.953125, -6.12841796875, -5.3037109375, -4.47900390625, -3.654296875, -2.82958984375, -2.0048828125, -1.18017578125, -0.35546875, 0.46923828125, 1.2939453125, 2.11865234375, 2.943359375, 3.76806640625, 4.5927734375, 5.41748046875, 6.2421875, 7.06689453125, 7.8916015625, 8.71630859375, 9.541015625, 10.36572265625, 11.1904296875, 12.01513671875, 12.83984375, 13.66455078125, 14.4892578125, 15.31396484375, 16.138671875, 16.96337890625, 17.7880859375, 18.61279296875, 19.4375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 16.0, 80.0, 192.0, 285.0, 246.0, 144.0, 45.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-200.8099822998047, -196.77439880371094, -192.73883056640625, -188.7032470703125, -184.6676788330078, -180.63209533691406, -176.59652709960938, -172.56094360351562, -168.52536010742188, -164.48977661132812, -160.45420837402344, -156.4186248779297, -152.383056640625, -148.34747314453125, -144.31190490722656, -140.2763214111328, -136.24075317382812, -132.20516967773438, -128.1696014404297, -124.13402557373047, -120.09844970703125, -116.0628662109375, -112.02729034423828, -107.99171447753906, -103.95613861083984, -99.92056274414062, -95.8849868774414, -91.84941101074219, -87.81382751464844, -83.77825927734375, -79.74267578125, -75.70709991455078, -71.6715087890625, -67.63593292236328, -63.60035705566406, -59.56477737426758, -55.52920150756836, -51.49362564086914, -47.458045959472656, -43.42247009277344, -39.386898040771484, -35.351322174072266, -31.315744400024414, -27.280166625976562, -23.244590759277344, -19.209014892578125, -15.173437118530273, -11.137859344482422, -7.102283477783203, -3.066706657409668, 0.9688701629638672, 5.004446983337402, 9.040023803710938, 13.075599670410156, 17.111177444458008, 21.14675521850586, 25.182331085205078, 29.217906951904297, 33.25348663330078, 37.2890625, 41.32463836669922, 45.36021423339844, 49.395790100097656, 53.43136978149414, 57.46694564819336]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 7.0, 6.0, 11.0, 20.0, 16.0, 17.0, 18.0, 21.0, 23.0, 27.0, 34.0, 29.0, 23.0, 47.0, 42.0, 28.0, 36.0, 41.0, 41.0, 42.0, 39.0, 36.0, 38.0, 29.0, 35.0, 41.0, 31.0, 20.0, 23.0, 26.0, 21.0, 25.0, 15.0, 20.0, 11.0, 8.0, 5.0, 7.0, 5.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.257848739624023, -30.298168182373047, -29.338489532470703, -28.378808975219727, -27.41912841796875, -26.459447860717773, -25.499767303466797, -24.540088653564453, -23.580408096313477, -22.6207275390625, -21.661048889160156, -20.70136833190918, -19.741687774658203, -18.782007217407227, -17.82232666015625, -16.862648010253906, -15.90296745300293, -14.943286895751953, -13.983607292175293, -13.023927688598633, -12.064247131347656, -11.10456657409668, -10.14488697052002, -9.18520736694336, -8.225526809692383, -7.2658467292785645, -6.306166648864746, -5.346486568450928, -4.386806488037109, -3.427126407623291, -2.4674463272094727, -1.5077662467956543, -0.5480842590332031, 0.41159582138061523, 1.3712759017944336, 2.330955982208252, 3.2906360626220703, 4.250316143035889, 5.209996223449707, 6.169676303863525, 7.129356384277344, 8.08903694152832, 9.04871654510498, 10.00839614868164, 10.968076705932617, 11.927757263183594, 12.887436866760254, 13.847116470336914, 14.80679702758789, 15.766477584838867, 16.726158142089844, 17.685836791992188, 18.645517349243164, 19.60519790649414, 20.564876556396484, 21.52455711364746, 22.484237670898438, 23.443918228149414, 24.40359878540039, 25.363277435302734, 26.32295799255371, 27.282638549804688, 28.24231719970703, 29.201997756958008, 30.161678314208984]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 0.0, 3.0, 10.0, 7.0, 4.0, 7.0, 17.0, 9.0, 15.0, 8.0, 18.0, 21.0, 15.0, 29.0, 29.0, 33.0, 28.0, 40.0, 35.0, 48.0, 44.0, 44.0, 52.0, 54.0, 30.0, 40.0, 38.0, 32.0, 34.0, 26.0, 32.0, 26.0, 27.0, 28.0, 21.0, 14.0, 13.0, 13.0, 10.0, 12.0, 2.0, 8.0, 5.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.501953125, -3.39495849609375, -3.2879638671875, -3.18096923828125, -3.073974609375, -2.96697998046875, -2.8599853515625, -2.75299072265625, -2.64599609375, -2.53900146484375, -2.4320068359375, -2.32501220703125, -2.218017578125, -2.11102294921875, -2.0040283203125, -1.89703369140625, -1.7900390625, -1.68304443359375, -1.5760498046875, -1.46905517578125, -1.362060546875, -1.25506591796875, -1.1480712890625, -1.04107666015625, -0.93408203125, -0.82708740234375, -0.7200927734375, -0.61309814453125, -0.506103515625, -0.39910888671875, -0.2921142578125, -0.18511962890625, -0.078125, 0.02886962890625, 0.1358642578125, 0.24285888671875, 0.349853515625, 0.45684814453125, 0.5638427734375, 0.67083740234375, 0.77783203125, 0.88482666015625, 0.9918212890625, 1.09881591796875, 1.205810546875, 1.31280517578125, 1.4197998046875, 1.52679443359375, 1.6337890625, 1.74078369140625, 1.8477783203125, 1.95477294921875, 2.061767578125, 2.16876220703125, 2.2757568359375, 2.38275146484375, 2.48974609375, 2.59674072265625, 2.7037353515625, 2.81072998046875, 2.917724609375, 3.02471923828125, 3.1317138671875, 3.23870849609375, 3.345703125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 20.0, 14.0, 29.0, 39.0, 52.0, 95.0, 148.0, 221.0, 404.0, 582.0, 895.0, 1463.0, 2526.0, 3995.0, 6577.0, 10588.0, 17263.0, 28523.0, 47270.0, 78990.0, 135476.0, 214812.0, 198055.0, 120544.0, 71397.0, 42419.0, 25533.0, 15619.0, 9640.0, 5898.0, 3635.0, 2195.0, 1405.0, 810.0, 516.0, 338.0, 193.0, 134.0, 67.0, 63.0, 36.0, 21.0, 11.0, 11.0, 7.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.309814453125, -0.3003959655761719, -0.29097747802734375, -0.2815589904785156, -0.2721405029296875, -0.2627220153808594, -0.25330352783203125, -0.24388504028320312, -0.234466552734375, -0.22504806518554688, -0.21562957763671875, -0.20621109008789062, -0.1967926025390625, -0.18737411499023438, -0.17795562744140625, -0.16853713989257812, -0.15911865234375, -0.14970016479492188, -0.14028167724609375, -0.13086318969726562, -0.1214447021484375, -0.11202621459960938, -0.10260772705078125, -0.09318923950195312, -0.083770751953125, -0.07435226440429688, -0.06493377685546875, -0.055515289306640625, -0.0460968017578125, -0.036678314208984375, -0.02725982666015625, -0.017841339111328125, -0.0084228515625, 0.000995635986328125, 0.01041412353515625, 0.019832611083984375, 0.0292510986328125, 0.038669586181640625, 0.04808807373046875, 0.057506561279296875, 0.066925048828125, 0.07634353637695312, 0.08576202392578125, 0.09518051147460938, 0.1045989990234375, 0.11401748657226562, 0.12343597412109375, 0.13285446166992188, 0.14227294921875, 0.15169143676757812, 0.16110992431640625, 0.17052841186523438, 0.1799468994140625, 0.18936538696289062, 0.19878387451171875, 0.20820236206054688, 0.217620849609375, 0.22703933715820312, 0.23645782470703125, 0.24587631225585938, 0.2552947998046875, 0.2647132873535156, 0.27413177490234375, 0.2835502624511719, 0.29296875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 11.0, 7.0, 15.0, 9.0, 18.0, 27.0, 10.0, 22.0, 27.0, 24.0, 40.0, 40.0, 41.0, 54.0, 31.0, 50.0, 1073.0, 52.0, 47.0, 41.0, 48.0, 49.0, 35.0, 41.0, 34.0, 18.0, 28.0, 16.0, 16.0, 16.0, 10.0, 7.0, 15.0, 9.0, 9.0, 4.0, 3.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.927703857421875, -1.85345458984375, -1.779205322265625, -1.7049560546875, -1.630706787109375, -1.55645751953125, -1.482208251953125, -1.407958984375, -1.333709716796875, -1.25946044921875, -1.185211181640625, -1.1109619140625, -1.036712646484375, -0.96246337890625, -0.888214111328125, -0.81396484375, -0.739715576171875, -0.66546630859375, -0.591217041015625, -0.5169677734375, -0.442718505859375, -0.36846923828125, -0.294219970703125, -0.219970703125, -0.145721435546875, -0.07147216796875, 0.002777099609375, 0.0770263671875, 0.151275634765625, 0.22552490234375, 0.299774169921875, 0.3740234375, 0.448272705078125, 0.52252197265625, 0.596771240234375, 0.6710205078125, 0.745269775390625, 0.81951904296875, 0.893768310546875, 0.968017578125, 1.042266845703125, 1.11651611328125, 1.190765380859375, 1.2650146484375, 1.339263916015625, 1.41351318359375, 1.487762451171875, 1.56201171875, 1.636260986328125, 1.71051025390625, 1.784759521484375, 1.8590087890625, 1.933258056640625, 2.00750732421875, 2.081756591796875, 2.156005859375, 2.230255126953125, 2.30450439453125, 2.378753662109375, 2.4530029296875, 2.527252197265625, 2.60150146484375, 2.675750732421875, 2.75]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 10.0, 15.0, 15.0, 37.0, 55.0, 81.0, 125.0, 182.0, 306.0, 446.0, 689.0, 1128.0, 1810.0, 2710.0, 4267.0, 6320.0, 10160.0, 15631.0, 25329.0, 40981.0, 68678.0, 114083.0, 176186.0, 1249880.0, 146901.0, 89901.0, 53705.0, 32499.0, 19953.0, 12596.0, 8060.0, 5108.0, 3280.0, 2214.0, 1350.0, 880.0, 533.0, 364.0, 226.0, 168.0, 99.0, 54.0, 36.0, 37.0, 15.0, 11.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2325439453125, -0.22510528564453125, -0.2176666259765625, -0.21022796630859375, -0.202789306640625, -0.19535064697265625, -0.1879119873046875, -0.18047332763671875, -0.17303466796875, -0.16559600830078125, -0.1581573486328125, -0.15071868896484375, -0.143280029296875, -0.13584136962890625, -0.1284027099609375, -0.12096405029296875, -0.113525390625, -0.10608673095703125, -0.0986480712890625, -0.09120941162109375, -0.083770751953125, -0.07633209228515625, -0.0688934326171875, -0.06145477294921875, -0.05401611328125, -0.04657745361328125, -0.0391387939453125, -0.03170013427734375, -0.024261474609375, -0.01682281494140625, -0.0093841552734375, -0.00194549560546875, 0.0054931640625, 0.01293182373046875, 0.0203704833984375, 0.02780914306640625, 0.035247802734375, 0.04268646240234375, 0.0501251220703125, 0.05756378173828125, 0.06500244140625, 0.07244110107421875, 0.0798797607421875, 0.08731842041015625, 0.094757080078125, 0.10219573974609375, 0.1096343994140625, 0.11707305908203125, 0.12451171875, 0.13195037841796875, 0.1393890380859375, 0.14682769775390625, 0.154266357421875, 0.16170501708984375, 0.1691436767578125, 0.17658233642578125, 0.18402099609375, 0.19145965576171875, 0.1988983154296875, 0.20633697509765625, 0.213775634765625, 0.22121429443359375, 0.2286529541015625, 0.23609161376953125, 0.2435302734375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 10.0, 11.0, 10.0, 14.0, 20.0, 15.0, 25.0, 23.0, 32.0, 26.0, 34.0, 46.0, 63.0, 65.0, 43.0, 55.0, 55.0, 52.0, 47.0, 51.0, 46.0, 48.0, 25.0, 23.0, 31.0, 22.0, 18.0, 20.0, 13.0, 9.0, 7.0, 5.0, 4.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006999969482421875, -0.0006755143404006958, -0.0006510317325592041, -0.0006265491247177124, -0.0006020665168762207, -0.000577583909034729, -0.0005531013011932373, -0.0005286186933517456, -0.0005041360855102539, -0.0004796534776687622, -0.0004551708698272705, -0.0004306882619857788, -0.0004062056541442871, -0.0003817230463027954, -0.0003572404384613037, -0.000332757830619812, -0.0003082752227783203, -0.0002837926149368286, -0.0002593100070953369, -0.00023482739925384521, -0.00021034479141235352, -0.00018586218357086182, -0.00016137957572937012, -0.00013689696788787842, -0.00011241436004638672, -8.793175220489502e-05, -6.344914436340332e-05, -3.896653652191162e-05, -1.4483928680419922e-05, 9.998679161071777e-06, 3.4481287002563477e-05, 5.8963894844055176e-05, 8.344650268554688e-05, 0.00010792911052703857, 0.00013241171836853027, 0.00015689432621002197, 0.00018137693405151367, 0.00020585954189300537, 0.00023034214973449707, 0.00025482475757598877, 0.00027930736541748047, 0.00030378997325897217, 0.00032827258110046387, 0.00035275518894195557, 0.00037723779678344727, 0.00040172040462493896, 0.00042620301246643066, 0.00045068562030792236, 0.00047516822814941406, 0.0004996508359909058, 0.0005241334438323975, 0.0005486160516738892, 0.0005730986595153809, 0.0005975812673568726, 0.0006220638751983643, 0.000646546483039856, 0.0006710290908813477, 0.0006955116987228394, 0.0007199943065643311, 0.0007444769144058228, 0.0007689595222473145, 0.0007934421300888062, 0.0008179247379302979, 0.0008424073457717896, 0.0008668899536132812]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 8.0, 4.0, 10.0, 22.0, 25.0, 29.0, 24.0, 43.0, 41.0, 70.0, 90.0, 103.0, 141.0, 201.0, 229.0, 348.0, 723.0, 7438.0, 782059.0, 252528.0, 2568.0, 562.0, 320.0, 216.0, 151.0, 109.0, 100.0, 101.0, 69.0, 47.0, 26.0, 35.0, 29.0, 15.0, 21.0, 9.0, 7.0, 5.0, 7.0, 4.0, 2.0, 6.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.01459503173828125, -0.014198899269104004, -0.013802766799926758, -0.013406634330749512, -0.013010501861572266, -0.01261436939239502, -0.012218236923217773, -0.011822104454040527, -0.011425971984863281, -0.011029839515686035, -0.010633707046508789, -0.010237574577331543, -0.009841442108154297, -0.00944530963897705, -0.009049177169799805, -0.008653044700622559, -0.008256912231445312, -0.007860779762268066, -0.00746464729309082, -0.007068514823913574, -0.006672382354736328, -0.006276249885559082, -0.005880117416381836, -0.00548398494720459, -0.005087852478027344, -0.004691720008850098, -0.0042955875396728516, -0.0038994550704956055, -0.0035033226013183594, -0.0031071901321411133, -0.002711057662963867, -0.002314925193786621, -0.001918792724609375, -0.001522660255432129, -0.0011265277862548828, -0.0007303953170776367, -0.0003342628479003906, 6.186962127685547e-05, 0.00045800209045410156, 0.0008541345596313477, 0.0012502670288085938, 0.0016463994979858398, 0.002042531967163086, 0.002438664436340332, 0.002834796905517578, 0.0032309293746948242, 0.0036270618438720703, 0.004023194313049316, 0.0044193267822265625, 0.004815459251403809, 0.005211591720581055, 0.005607724189758301, 0.006003856658935547, 0.006399989128112793, 0.006796121597290039, 0.007192254066467285, 0.007588386535644531, 0.007984519004821777, 0.008380651473999023, 0.00877678394317627, 0.009172916412353516, 0.009569048881530762, 0.009965181350708008, 0.010361313819885254, 0.0107574462890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 50.0, 178.0, 325.0, 307.0, 109.0, 25.0, 8.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013764874311164021, -0.0013186584692448378, -0.0012608295073732734, -0.001203000545501709, -0.0011451717000454664, -0.0010873426217585802, -0.0010295137763023376, -0.0009716848144307733, -0.0009138558525592089, -0.0008560268906876445, -0.0007981979288160801, -0.0007403690251521766, -0.0006825400632806122, -0.0006247111014090478, -0.0005668821977451444, -0.00050905323587358, -0.0004512242740020156, -0.0003933953121304512, -0.00033556637936271727, -0.00027773744659498334, -0.00021990848472341895, -0.00016207952285185456, -0.00010425059008412063, -4.64216573163867e-05, 1.1407304555177689e-05, 6.923625187482685e-05, 0.000127065199194476, 0.00018489414651412517, 0.00024272309383377433, 0.0003005520557053387, 0.00035838098847307265, 0.0004162099212408066, 0.0004740389995276928, 0.0005318679613992572, 0.0005896969232708216, 0.000647525826934725, 0.0007053547888062894, 0.0007631837506778538, 0.0008210126543417573, 0.0008788416162133217, 0.0009366705780848861, 0.0009944995399564505, 0.0010523285018280149, 0.0011101574636995792, 0.0011679863091558218, 0.001225815387442708, 0.0012836442328989506, 0.001341473194770515, 0.0013993021566420794, 0.0014571311185136437, 0.0015149600803852081, 0.0015727890422567725, 0.001630618004128337, 0.0016884468495845795, 0.0017462758114561439, 0.0018041047733277082, 0.0018619337351992726, 0.001919762697070837, 0.0019775915425270796, 0.002035420620813966, 0.0020932494662702084, 0.0021510785445570946, 0.002208907390013337, 0.0022667362354695797, 0.002324565313756466]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 12.0, 10.0, 15.0, 21.0, 28.0, 22.0, 32.0, 44.0, 41.0, 39.0, 35.0, 36.0, 39.0, 42.0, 46.0, 44.0, 37.0, 43.0, 41.0, 42.0, 35.0, 32.0, 34.0, 29.0, 31.0, 28.0, 22.0, 22.0, 13.0, 13.0, 16.0, 16.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004877448081970215, -0.00047342386096715927, -0.00045910291373729706, -0.00044478196650743484, -0.00043046101927757263, -0.0004161400720477104, -0.0004018191248178482, -0.000387498177587986, -0.0003731772303581238, -0.00035885628312826157, -0.00034453533589839935, -0.00033021438866853714, -0.0003158934414386749, -0.0003015724942088127, -0.0002872515469789505, -0.0002729305997490883, -0.0002586096525192261, -0.00024428870528936386, -0.00022996775805950165, -0.00021564681082963943, -0.00020132586359977722, -0.000187004916369915, -0.0001726839691400528, -0.00015836302191019058, -0.00014404207468032837, -0.00012972112745046616, -0.00011540018022060394, -0.00010107923299074173, -8.675828576087952e-05, -7.24373385310173e-05, -5.811639130115509e-05, -4.379544407129288e-05, -2.9474496841430664e-05, -1.5153549611568451e-05, -8.326023817062378e-07, 1.3488344848155975e-05, 2.780929207801819e-05, 4.21302393078804e-05, 5.6451186537742615e-05, 7.077213376760483e-05, 8.509308099746704e-05, 9.941402822732925e-05, 0.00011373497545719147, 0.00012805592268705368, 0.0001423768699169159, 0.0001566978171467781, 0.00017101876437664032, 0.00018533971160650253, 0.00019966065883636475, 0.00021398160606622696, 0.00022830255329608917, 0.00024262350052595139, 0.0002569444477558136, 0.0002712653949856758, 0.000285586342215538, 0.00029990728944540024, 0.00031422823667526245, 0.00032854918390512466, 0.0003428701311349869, 0.0003571910783648491, 0.0003715120255947113, 0.0003858329728245735, 0.00040015392005443573, 0.00041447486728429794, 0.00042879581451416016]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 0.0, 3.0, 10.0, 7.0, 4.0, 7.0, 17.0, 9.0, 15.0, 8.0, 18.0, 21.0, 15.0, 29.0, 29.0, 33.0, 28.0, 40.0, 35.0, 48.0, 44.0, 44.0, 52.0, 54.0, 30.0, 40.0, 38.0, 32.0, 34.0, 26.0, 32.0, 26.0, 27.0, 28.0, 21.0, 13.0, 14.0, 13.0, 10.0, 12.0, 2.0, 8.0, 5.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.501953125, -3.39495849609375, -3.2879638671875, -3.18096923828125, -3.073974609375, -2.96697998046875, -2.8599853515625, -2.75299072265625, -2.64599609375, -2.53900146484375, -2.4320068359375, -2.32501220703125, -2.218017578125, -2.11102294921875, -2.0040283203125, -1.89703369140625, -1.7900390625, -1.68304443359375, -1.5760498046875, -1.46905517578125, -1.362060546875, -1.25506591796875, -1.1480712890625, -1.04107666015625, -0.93408203125, -0.82708740234375, -0.7200927734375, -0.61309814453125, -0.506103515625, -0.39910888671875, -0.2921142578125, -0.18511962890625, -0.078125, 0.02886962890625, 0.1358642578125, 0.24285888671875, 0.349853515625, 0.45684814453125, 0.5638427734375, 0.67083740234375, 0.77783203125, 0.88482666015625, 0.9918212890625, 1.09881591796875, 1.205810546875, 1.31280517578125, 1.4197998046875, 1.52679443359375, 1.6337890625, 1.74078369140625, 1.8477783203125, 1.95477294921875, 2.061767578125, 2.16876220703125, 2.2757568359375, 2.38275146484375, 2.48974609375, 2.59674072265625, 2.7037353515625, 2.81072998046875, 2.917724609375, 3.02471923828125, 3.1317138671875, 3.23870849609375, 3.345703125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 7.0, 11.0, 15.0, 25.0, 35.0, 43.0, 66.0, 113.0, 119.0, 235.0, 351.0, 563.0, 960.0, 1601.0, 2644.0, 4752.0, 8418.0, 15738.0, 30462.0, 61101.0, 120977.0, 209728.0, 243148.0, 166556.0, 88055.0, 43728.0, 22154.0, 11604.0, 6351.0, 3558.0, 2003.0, 1290.0, 783.0, 473.0, 287.0, 198.0, 116.0, 78.0, 49.0, 38.0, 29.0, 23.0, 14.0, 9.0, 14.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.244140625, -2.16998291015625, -2.0958251953125, -2.02166748046875, -1.947509765625, -1.87335205078125, -1.7991943359375, -1.72503662109375, -1.65087890625, -1.57672119140625, -1.5025634765625, -1.42840576171875, -1.354248046875, -1.28009033203125, -1.2059326171875, -1.13177490234375, -1.0576171875, -0.98345947265625, -0.9093017578125, -0.83514404296875, -0.760986328125, -0.68682861328125, -0.6126708984375, -0.53851318359375, -0.46435546875, -0.39019775390625, -0.3160400390625, -0.24188232421875, -0.167724609375, -0.09356689453125, -0.0194091796875, 0.05474853515625, 0.12890625, 0.20306396484375, 0.2772216796875, 0.35137939453125, 0.425537109375, 0.49969482421875, 0.5738525390625, 0.64801025390625, 0.72216796875, 0.79632568359375, 0.8704833984375, 0.94464111328125, 1.018798828125, 1.09295654296875, 1.1671142578125, 1.24127197265625, 1.3154296875, 1.38958740234375, 1.4637451171875, 1.53790283203125, 1.612060546875, 1.68621826171875, 1.7603759765625, 1.83453369140625, 1.90869140625, 1.98284912109375, 2.0570068359375, 2.13116455078125, 2.205322265625, 2.27947998046875, 2.3536376953125, 2.42779541015625, 2.501953125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 16.0, 12.0, 7.0, 9.0, 17.0, 12.0, 15.0, 25.0, 16.0, 39.0, 26.0, 29.0, 44.0, 51.0, 44.0, 71.0, 169.0, 1517.0, 351.0, 132.0, 65.0, 40.0, 48.0, 42.0, 34.0, 30.0, 28.0, 21.0, 33.0, 24.0, 16.0, 19.0, 8.0, 6.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.49853515625, -13.0751953125, -12.65185546875, -12.228515625, -11.80517578125, -11.3818359375, -10.95849609375, -10.53515625, -10.11181640625, -9.6884765625, -9.26513671875, -8.841796875, -8.41845703125, -7.9951171875, -7.57177734375, -7.1484375, -6.72509765625, -6.3017578125, -5.87841796875, -5.455078125, -5.03173828125, -4.6083984375, -4.18505859375, -3.76171875, -3.33837890625, -2.9150390625, -2.49169921875, -2.068359375, -1.64501953125, -1.2216796875, -0.79833984375, -0.375, 0.04833984375, 0.4716796875, 0.89501953125, 1.318359375, 1.74169921875, 2.1650390625, 2.58837890625, 3.01171875, 3.43505859375, 3.8583984375, 4.28173828125, 4.705078125, 5.12841796875, 5.5517578125, 5.97509765625, 6.3984375, 6.82177734375, 7.2451171875, 7.66845703125, 8.091796875, 8.51513671875, 8.9384765625, 9.36181640625, 9.78515625, 10.20849609375, 10.6318359375, 11.05517578125, 11.478515625, 11.90185546875, 12.3251953125, 12.74853515625, 13.171875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 7.0, 1.0, 5.0, 3.0, 7.0, 11.0, 12.0, 26.0, 20.0, 24.0, 36.0, 28.0, 43.0, 70.0, 64.0, 100.0, 149.0, 290.0, 546.0, 1880.0, 22509.0, 2461568.0, 646594.0, 9282.0, 1187.0, 451.0, 218.0, 148.0, 113.0, 62.0, 49.0, 42.0, 30.0, 20.0, 15.0, 11.0, 17.0, 10.0, 15.0, 14.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.21875, -18.595947265625, -17.97314453125, -17.350341796875, -16.7275390625, -16.104736328125, -15.48193359375, -14.859130859375, -14.236328125, -13.613525390625, -12.99072265625, -12.367919921875, -11.7451171875, -11.122314453125, -10.49951171875, -9.876708984375, -9.25390625, -8.631103515625, -8.00830078125, -7.385498046875, -6.7626953125, -6.139892578125, -5.51708984375, -4.894287109375, -4.271484375, -3.648681640625, -3.02587890625, -2.403076171875, -1.7802734375, -1.157470703125, -0.53466796875, 0.088134765625, 0.7109375, 1.333740234375, 1.95654296875, 2.579345703125, 3.2021484375, 3.824951171875, 4.44775390625, 5.070556640625, 5.693359375, 6.316162109375, 6.93896484375, 7.561767578125, 8.1845703125, 8.807373046875, 9.43017578125, 10.052978515625, 10.67578125, 11.298583984375, 11.92138671875, 12.544189453125, 13.1669921875, 13.789794921875, 14.41259765625, 15.035400390625, 15.658203125, 16.281005859375, 16.90380859375, 17.526611328125, 18.1494140625, 18.772216796875, 19.39501953125, 20.017822265625, 20.640625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [3.0, 25.0, 181.0, 464.0, 299.0, 39.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.677033424377441, -6.325624465942383, -3.974215507507324, -1.6228065490722656, 0.728602409362793, 3.0800113677978516, 5.43142032623291, 7.782828330993652, 10.134238243103027, 12.485647201538086, 14.837056159973145, 17.188465118408203, 19.539875030517578, 21.89128303527832, 24.242691040039062, 26.594100952148438, 28.945510864257812, 31.296920776367188, 33.64833068847656, 35.99973678588867, 38.35114669799805, 40.70255661010742, 43.05396270751953, 45.405372619628906, 47.75678253173828, 50.108192443847656, 52.45960235595703, 54.81100845336914, 57.162418365478516, 59.51382827758789, 61.865234375, 64.21664428710938, 66.56805419921875, 68.91946411132812, 71.2708740234375, 73.62228393554688, 75.97369384765625, 78.3250961303711, 80.67650604248047, 83.02791595458984, 85.37932586669922, 87.7307357788086, 90.08214569091797, 92.43355560302734, 94.78495788574219, 97.13636779785156, 99.48777770996094, 101.83918762207031, 104.19059753417969, 106.54200744628906, 108.89341735839844, 111.24482727050781, 113.59623718261719, 115.94763946533203, 118.2990493774414, 120.65045928955078, 123.00186920166016, 125.35327911376953, 127.7046890258789, 130.05609130859375, 132.40750122070312, 134.7589111328125, 137.11032104492188, 139.46173095703125, 141.81314086914062]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 11.0, 11.0, 19.0, 20.0, 32.0, 22.0, 27.0, 41.0, 45.0, 39.0, 42.0, 47.0, 50.0, 44.0, 45.0, 35.0, 46.0, 39.0, 42.0, 36.0, 42.0, 36.0, 35.0, 23.0, 21.0, 24.0, 17.0, 19.0, 11.0, 11.0, 12.0, 13.0, 3.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.44906234741211, -41.07564926147461, -39.70223617553711, -38.32882308959961, -36.955413818359375, -35.582000732421875, -34.208587646484375, -32.835174560546875, -31.461761474609375, -30.088348388671875, -28.714935302734375, -27.341524124145508, -25.968111038208008, -24.594697952270508, -23.22128677368164, -21.84787368774414, -20.47446060180664, -19.10104751586914, -17.72763442993164, -16.354223251342773, -14.980810165405273, -13.607397079467773, -12.23398494720459, -10.860572814941406, -9.487159729003906, -8.113746643066406, -6.740334510803223, -5.366921901702881, -3.993509292602539, -2.6200966835021973, -1.2466840744018555, 0.12672805786132812, 1.5001449584960938, 2.8735575675964355, 4.246970176696777, 5.620382785797119, 6.993795394897461, 8.367208480834961, 9.740620613098145, 11.114032745361328, 12.487445831298828, 13.860858917236328, 15.234271049499512, 16.607683181762695, 17.981096267700195, 19.354509353637695, 20.727920532226562, 22.101333618164062, 23.474746704101562, 24.848159790039062, 26.221572875976562, 27.59498405456543, 28.96839714050293, 30.34181022644043, 31.715221405029297, 33.0886344909668, 34.4620475769043, 35.8354606628418, 37.2088737487793, 38.5822868347168, 39.95569610595703, 41.32910919189453, 42.70252227783203, 44.07593536376953, 45.44934844970703]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 4.0, 6.0, 6.0, 6.0, 10.0, 6.0, 11.0, 6.0, 11.0, 12.0, 17.0, 12.0, 29.0, 25.0, 24.0, 26.0, 32.0, 30.0, 52.0, 36.0, 38.0, 46.0, 41.0, 47.0, 41.0, 47.0, 37.0, 34.0, 36.0, 28.0, 27.0, 35.0, 23.0, 23.0, 23.0, 22.0, 17.0, 15.0, 5.0, 7.0, 13.0, 7.0, 6.0, 5.0, 4.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.66015625, -3.550079345703125, -3.44000244140625, -3.329925537109375, -3.2198486328125, -3.109771728515625, -2.99969482421875, -2.889617919921875, -2.779541015625, -2.669464111328125, -2.55938720703125, -2.449310302734375, -2.3392333984375, -2.229156494140625, -2.11907958984375, -2.009002685546875, -1.89892578125, -1.788848876953125, -1.67877197265625, -1.568695068359375, -1.4586181640625, -1.348541259765625, -1.23846435546875, -1.128387451171875, -1.018310546875, -0.908233642578125, -0.79815673828125, -0.688079833984375, -0.5780029296875, -0.467926025390625, -0.35784912109375, -0.247772216796875, -0.1376953125, -0.027618408203125, 0.08245849609375, 0.192535400390625, 0.3026123046875, 0.412689208984375, 0.52276611328125, 0.632843017578125, 0.742919921875, 0.852996826171875, 0.96307373046875, 1.073150634765625, 1.1832275390625, 1.293304443359375, 1.40338134765625, 1.513458251953125, 1.62353515625, 1.733612060546875, 1.84368896484375, 1.953765869140625, 2.0638427734375, 2.173919677734375, 2.28399658203125, 2.394073486328125, 2.504150390625, 2.614227294921875, 2.72430419921875, 2.834381103515625, 2.9444580078125, 3.054534912109375, 3.16461181640625, 3.274688720703125, 3.384765625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 7.0, 6.0, 6.0, 6.0, 12.0, 12.0, 12.0, 19.0, 18.0, 21.0, 33.0, 47.0, 77.0, 106.0, 191.0, 340.0, 744.0, 2228.0, 7932.0, 33319.0, 180995.0, 1151332.0, 2170498.0, 536932.0, 84929.0, 17521.0, 4367.0, 1386.0, 486.0, 235.0, 121.0, 93.0, 57.0, 41.0, 21.0, 18.0, 27.0, 7.0, 13.0, 13.0, 10.0, 5.0, 1.0, 14.0, 3.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.6484375, -8.38861083984375, -8.1287841796875, -7.86895751953125, -7.609130859375, -7.34930419921875, -7.0894775390625, -6.82965087890625, -6.56982421875, -6.30999755859375, -6.0501708984375, -5.79034423828125, -5.530517578125, -5.27069091796875, -5.0108642578125, -4.75103759765625, -4.4912109375, -4.23138427734375, -3.9715576171875, -3.71173095703125, -3.451904296875, -3.19207763671875, -2.9322509765625, -2.67242431640625, -2.41259765625, -2.15277099609375, -1.8929443359375, -1.63311767578125, -1.373291015625, -1.11346435546875, -0.8536376953125, -0.59381103515625, -0.333984375, -0.07415771484375, 0.1856689453125, 0.44549560546875, 0.705322265625, 0.96514892578125, 1.2249755859375, 1.48480224609375, 1.74462890625, 2.00445556640625, 2.2642822265625, 2.52410888671875, 2.783935546875, 3.04376220703125, 3.3035888671875, 3.56341552734375, 3.8232421875, 4.08306884765625, 4.3428955078125, 4.60272216796875, 4.862548828125, 5.12237548828125, 5.3822021484375, 5.64202880859375, 5.90185546875, 6.16168212890625, 6.4215087890625, 6.68133544921875, 6.941162109375, 7.20098876953125, 7.4608154296875, 7.72064208984375, 7.98046875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 13.0, 18.0, 22.0, 22.0, 27.0, 52.0, 53.0, 77.0, 115.0, 152.0, 206.0, 252.0, 347.0, 444.0, 423.0, 409.0, 334.0, 286.0, 214.0, 155.0, 123.0, 98.0, 58.0, 54.0, 23.0, 23.0, 18.0, 7.0, 13.0, 4.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4654541015625, -8.157470703125, -7.8494873046875, -7.54150390625, -7.2335205078125, -6.925537109375, -6.6175537109375, -6.3095703125, -6.0015869140625, -5.693603515625, -5.3856201171875, -5.07763671875, -4.7696533203125, -4.461669921875, -4.1536865234375, -3.845703125, -3.5377197265625, -3.229736328125, -2.9217529296875, -2.61376953125, -2.3057861328125, -1.997802734375, -1.6898193359375, -1.3818359375, -1.0738525390625, -0.765869140625, -0.4578857421875, -0.14990234375, 0.1580810546875, 0.466064453125, 0.7740478515625, 1.08203125, 1.3900146484375, 1.697998046875, 2.0059814453125, 2.31396484375, 2.6219482421875, 2.929931640625, 3.2379150390625, 3.5458984375, 3.8538818359375, 4.161865234375, 4.4698486328125, 4.77783203125, 5.0858154296875, 5.393798828125, 5.7017822265625, 6.009765625, 6.3177490234375, 6.625732421875, 6.9337158203125, 7.24169921875, 7.5496826171875, 7.857666015625, 8.1656494140625, 8.4736328125, 8.7816162109375, 9.089599609375, 9.3975830078125, 9.70556640625, 10.0135498046875, 10.321533203125, 10.6295166015625, 10.9375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 12.0, 11.0, 15.0, 15.0, 35.0, 29.0, 51.0, 38.0, 69.0, 92.0, 139.0, 194.0, 357.0, 722.0, 1803.0, 6800.0, 33747.0, 219756.0, 1556559.0, 2007388.0, 307990.0, 45637.0, 8523.0, 2255.0, 834.0, 409.0, 206.0, 163.0, 112.0, 75.0, 64.0, 38.0, 32.0, 22.0, 19.0, 14.0, 17.0, 11.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.65625, -14.199462890625, -13.74267578125, -13.285888671875, -12.8291015625, -12.372314453125, -11.91552734375, -11.458740234375, -11.001953125, -10.545166015625, -10.08837890625, -9.631591796875, -9.1748046875, -8.718017578125, -8.26123046875, -7.804443359375, -7.34765625, -6.890869140625, -6.43408203125, -5.977294921875, -5.5205078125, -5.063720703125, -4.60693359375, -4.150146484375, -3.693359375, -3.236572265625, -2.77978515625, -2.322998046875, -1.8662109375, -1.409423828125, -0.95263671875, -0.495849609375, -0.0390625, 0.417724609375, 0.87451171875, 1.331298828125, 1.7880859375, 2.244873046875, 2.70166015625, 3.158447265625, 3.615234375, 4.072021484375, 4.52880859375, 4.985595703125, 5.4423828125, 5.899169921875, 6.35595703125, 6.812744140625, 7.26953125, 7.726318359375, 8.18310546875, 8.639892578125, 9.0966796875, 9.553466796875, 10.01025390625, 10.467041015625, 10.923828125, 11.380615234375, 11.83740234375, 12.294189453125, 12.7509765625, 13.207763671875, 13.66455078125, 14.121337890625, 14.578125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 14.0, 19.0, 29.0, 69.0, 64.0, 90.0, 90.0, 107.0, 101.0, 115.0, 89.0, 84.0, 57.0, 31.0, 24.0, 11.0, 9.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.82568359375, -35.23188781738281, -33.63808822631836, -32.04429244995117, -30.45049476623535, -28.85669708251953, -27.26289939880371, -25.66910171508789, -24.075305938720703, -22.481508255004883, -20.887710571289062, -19.293914794921875, -17.700117111206055, -16.106319427490234, -14.512521743774414, -12.91872501373291, -11.324926376342773, -9.731128692626953, -8.13733196258545, -6.543534278869629, -4.949737071990967, -3.3559398651123047, -1.7621421813964844, -0.16834545135498047, 1.4254522323608398, 3.019249439239502, 4.613046646118164, 6.206844329833984, 7.8006415367126465, 9.394438743591309, 10.988236427307129, 12.582033157348633, 14.175830841064453, 15.769628524780273, 17.363426208496094, 18.95722198486328, 20.5510196685791, 22.144817352294922, 23.738615036010742, 25.332412719726562, 26.92620849609375, 28.52000617980957, 30.11380386352539, 31.707599639892578, 33.30139923095703, 34.89519500732422, 36.488990783691406, 38.08279037475586, 39.67658996582031, 41.2703857421875, 42.86418533325195, 44.45798110961914, 46.051780700683594, 47.64557647705078, 49.23937225341797, 50.83317184448242, 52.42696762084961, 54.0207633972168, 55.61456298828125, 57.20835876464844, 58.80215835571289, 60.39595413208008, 61.98975372314453, 63.58354949951172, 65.1773452758789]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 3.0, 7.0, 8.0, 7.0, 11.0, 8.0, 14.0, 19.0, 26.0, 19.0, 27.0, 25.0, 24.0, 30.0, 30.0, 27.0, 33.0, 45.0, 29.0, 35.0, 30.0, 42.0, 42.0, 35.0, 34.0, 35.0, 40.0, 33.0, 36.0, 30.0, 28.0, 17.0, 17.0, 21.0, 22.0, 19.0, 13.0, 13.0, 11.0, 9.0, 9.0, 7.0, 6.0, 3.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.311731338500977, -27.35302734375, -26.394325256347656, -25.435623168945312, -24.476919174194336, -23.51821517944336, -22.559513092041016, -21.600811004638672, -20.642107009887695, -19.68340301513672, -18.724700927734375, -17.76599884033203, -16.807294845581055, -15.848591804504395, -14.889888763427734, -13.931185722351074, -12.972482681274414, -12.013779640197754, -11.055076599121094, -10.096373558044434, -9.137670516967773, -8.178967475891113, -7.220264434814453, -6.261561393737793, -5.302858352661133, -4.344155311584473, -3.3854522705078125, -2.4267492294311523, -1.4680461883544922, -0.509343147277832, 0.4493598937988281, 1.4080629348754883, 2.3667678833007812, 3.3254709243774414, 4.284173965454102, 5.242877006530762, 6.201580047607422, 7.160283088684082, 8.118986129760742, 9.077689170837402, 10.036392211914062, 10.995095252990723, 11.953798294067383, 12.912501335144043, 13.871204376220703, 14.829907417297363, 15.788610458374023, 16.747314453125, 17.706016540527344, 18.664718627929688, 19.623422622680664, 20.58212661743164, 21.540828704833984, 22.499530792236328, 23.458234786987305, 24.41693878173828, 25.375640869140625, 26.33434295654297, 27.293046951293945, 28.251750946044922, 29.210453033447266, 30.16915512084961, 31.127859115600586, 32.08656311035156, 33.045265197753906]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 4.0, 8.0, 8.0, 12.0, 10.0, 15.0, 14.0, 20.0, 22.0, 29.0, 26.0, 32.0, 44.0, 48.0, 52.0, 54.0, 56.0, 47.0, 46.0, 56.0, 49.0, 29.0, 46.0, 45.0, 34.0, 29.0, 21.0, 20.0, 23.0, 19.0, 15.0, 9.0, 16.0, 9.0, 13.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.75390625, -4.6187744140625, -4.483642578125, -4.3485107421875, -4.21337890625, -4.0782470703125, -3.943115234375, -3.8079833984375, -3.6728515625, -3.5377197265625, -3.402587890625, -3.2674560546875, -3.13232421875, -2.9971923828125, -2.862060546875, -2.7269287109375, -2.591796875, -2.4566650390625, -2.321533203125, -2.1864013671875, -2.05126953125, -1.9161376953125, -1.781005859375, -1.6458740234375, -1.5107421875, -1.3756103515625, -1.240478515625, -1.1053466796875, -0.97021484375, -0.8350830078125, -0.699951171875, -0.5648193359375, -0.4296875, -0.2945556640625, -0.159423828125, -0.0242919921875, 0.11083984375, 0.2459716796875, 0.381103515625, 0.5162353515625, 0.6513671875, 0.7864990234375, 0.921630859375, 1.0567626953125, 1.19189453125, 1.3270263671875, 1.462158203125, 1.5972900390625, 1.732421875, 1.8675537109375, 2.002685546875, 2.1378173828125, 2.27294921875, 2.4080810546875, 2.543212890625, 2.6783447265625, 2.8134765625, 2.9486083984375, 3.083740234375, 3.2188720703125, 3.35400390625, 3.4891357421875, 3.624267578125, 3.7593994140625, 3.89453125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 9.0, 8.0, 18.0, 33.0, 41.0, 52.0, 93.0, 123.0, 179.0, 292.0, 454.0, 663.0, 1034.0, 1627.0, 2598.0, 4202.0, 6646.0, 10970.0, 17758.0, 29074.0, 47054.0, 76689.0, 126432.0, 196821.0, 197553.0, 126835.0, 77551.0, 47597.0, 29014.0, 17772.0, 10956.0, 6868.0, 4188.0, 2640.0, 1600.0, 1050.0, 734.0, 453.0, 291.0, 198.0, 118.0, 85.0, 54.0, 48.0, 21.0, 26.0, 15.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.2824974060058594, -0.27275848388671875, -0.2630195617675781, -0.2532806396484375, -0.24354171752929688, -0.23380279541015625, -0.22406387329101562, -0.214324951171875, -0.20458602905273438, -0.19484710693359375, -0.18510818481445312, -0.1753692626953125, -0.16563034057617188, -0.15589141845703125, -0.14615249633789062, -0.13641357421875, -0.12667465209960938, -0.11693572998046875, -0.10719680786132812, -0.0974578857421875, -0.08771896362304688, -0.07798004150390625, -0.06824111938476562, -0.058502197265625, -0.048763275146484375, -0.03902435302734375, -0.029285430908203125, -0.0195465087890625, -0.009807586669921875, -6.866455078125e-05, 0.009670257568359375, 0.0194091796875, 0.029148101806640625, 0.03888702392578125, 0.048625946044921875, 0.0583648681640625, 0.06810379028320312, 0.07784271240234375, 0.08758163452148438, 0.097320556640625, 0.10705947875976562, 0.11679840087890625, 0.12653732299804688, 0.1362762451171875, 0.14601516723632812, 0.15575408935546875, 0.16549301147460938, 0.17523193359375, 0.18497085571289062, 0.19470977783203125, 0.20444869995117188, 0.2141876220703125, 0.22392654418945312, 0.23366546630859375, 0.24340438842773438, 0.253143310546875, 0.2628822326660156, 0.27262115478515625, 0.2823600769042969, 0.2920989990234375, 0.3018379211425781, 0.31157684326171875, 0.3213157653808594, 0.3310546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 2.0, 4.0, 17.0, 12.0, 10.0, 24.0, 11.0, 22.0, 22.0, 32.0, 27.0, 37.0, 34.0, 38.0, 55.0, 46.0, 46.0, 1077.0, 56.0, 41.0, 59.0, 43.0, 42.0, 37.0, 56.0, 35.0, 25.0, 18.0, 19.0, 12.0, 13.0, 16.0, 6.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.853515625, -2.76409912109375, -2.6746826171875, -2.58526611328125, -2.495849609375, -2.40643310546875, -2.3170166015625, -2.22760009765625, -2.13818359375, -2.04876708984375, -1.9593505859375, -1.86993408203125, -1.780517578125, -1.69110107421875, -1.6016845703125, -1.51226806640625, -1.4228515625, -1.33343505859375, -1.2440185546875, -1.15460205078125, -1.065185546875, -0.97576904296875, -0.8863525390625, -0.79693603515625, -0.70751953125, -0.61810302734375, -0.5286865234375, -0.43927001953125, -0.349853515625, -0.26043701171875, -0.1710205078125, -0.08160400390625, 0.0078125, 0.09722900390625, 0.1866455078125, 0.27606201171875, 0.365478515625, 0.45489501953125, 0.5443115234375, 0.63372802734375, 0.72314453125, 0.81256103515625, 0.9019775390625, 0.99139404296875, 1.080810546875, 1.17022705078125, 1.2596435546875, 1.34906005859375, 1.4384765625, 1.52789306640625, 1.6173095703125, 1.70672607421875, 1.796142578125, 1.88555908203125, 1.9749755859375, 2.06439208984375, 2.15380859375, 2.24322509765625, 2.3326416015625, 2.42205810546875, 2.511474609375, 2.60089111328125, 2.6903076171875, 2.77972412109375, 2.869140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 13.0, 14.0, 33.0, 42.0, 59.0, 90.0, 129.0, 246.0, 389.0, 695.0, 1117.0, 1959.0, 3285.0, 5361.0, 9378.0, 16020.0, 27574.0, 47281.0, 79982.0, 133710.0, 985607.0, 460114.0, 132258.0, 79660.0, 46303.0, 27102.0, 15781.0, 9369.0, 5610.0, 3230.0, 1861.0, 1114.0, 714.0, 378.0, 262.0, 157.0, 80.0, 59.0, 32.0, 25.0, 14.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.302490234375, -0.2935905456542969, -0.28469085693359375, -0.2757911682128906, -0.2668914794921875, -0.2579917907714844, -0.24909210205078125, -0.24019241333007812, -0.231292724609375, -0.22239303588867188, -0.21349334716796875, -0.20459365844726562, -0.1956939697265625, -0.18679428100585938, -0.17789459228515625, -0.16899490356445312, -0.16009521484375, -0.15119552612304688, -0.14229583740234375, -0.13339614868164062, -0.1244964599609375, -0.11559677124023438, -0.10669708251953125, -0.09779739379882812, -0.088897705078125, -0.07999801635742188, -0.07109832763671875, -0.062198638916015625, -0.0532989501953125, -0.044399261474609375, -0.03549957275390625, -0.026599884033203125, -0.0177001953125, -0.008800506591796875, 9.918212890625e-05, 0.008998870849609375, 0.0178985595703125, 0.026798248291015625, 0.03569793701171875, 0.044597625732421875, 0.053497314453125, 0.062397003173828125, 0.07129669189453125, 0.08019638061523438, 0.0890960693359375, 0.09799575805664062, 0.10689544677734375, 0.11579513549804688, 0.12469482421875, 0.13359451293945312, 0.14249420166015625, 0.15139389038085938, 0.1602935791015625, 0.16919326782226562, 0.17809295654296875, 0.18699264526367188, 0.195892333984375, 0.20479202270507812, 0.21369171142578125, 0.22259140014648438, 0.2314910888671875, 0.24039077758789062, 0.24929046630859375, 0.2581901550292969, 0.26708984375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 4.0, 6.0, 10.0, 9.0, 16.0, 19.0, 20.0, 28.0, 45.0, 29.0, 53.0, 51.0, 79.0, 69.0, 64.0, 80.0, 70.0, 61.0, 58.0, 49.0, 38.0, 24.0, 20.0, 20.0, 13.0, 12.0, 8.0, 4.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0010089874267578125, -0.0009768903255462646, -0.0009447932243347168, -0.0009126961231231689, -0.0008805990219116211, -0.0008485019207000732, -0.0008164048194885254, -0.0007843077182769775, -0.0007522106170654297, -0.0007201135158538818, -0.000688016414642334, -0.0006559193134307861, -0.0006238222122192383, -0.0005917251110076904, -0.0005596280097961426, -0.0005275309085845947, -0.0004954338073730469, -0.000463336706161499, -0.00043123960494995117, -0.0003991425037384033, -0.00036704540252685547, -0.0003349483013153076, -0.00030285120010375977, -0.0002707540988922119, -0.00023865699768066406, -0.0002065598964691162, -0.00017446279525756836, -0.0001423656940460205, -0.00011026859283447266, -7.81714916229248e-05, -4.607439041137695e-05, -1.3977289199829102e-05, 1.811981201171875e-05, 5.02169132232666e-05, 8.231401443481445e-05, 0.0001144111156463623, 0.00014650821685791016, 0.000178605318069458, 0.00021070241928100586, 0.0002427995204925537, 0.00027489662170410156, 0.0003069937229156494, 0.00033909082412719727, 0.0003711879253387451, 0.00040328502655029297, 0.0004353821277618408, 0.00046747922897338867, 0.0004995763301849365, 0.0005316734313964844, 0.0005637705326080322, 0.0005958676338195801, 0.0006279647350311279, 0.0006600618362426758, 0.0006921589374542236, 0.0007242560386657715, 0.0007563531398773193, 0.0007884502410888672, 0.000820547342300415, 0.0008526444435119629, 0.0008847415447235107, 0.0009168386459350586, 0.0009489357471466064, 0.0009810328483581543, 0.0010131299495697021, 0.00104522705078125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 6.0, 9.0, 11.0, 13.0, 13.0, 17.0, 33.0, 48.0, 67.0, 84.0, 117.0, 230.0, 317.0, 576.0, 4681.0, 957314.0, 82663.0, 1146.0, 431.0, 244.0, 155.0, 102.0, 66.0, 48.0, 42.0, 22.0, 24.0, 16.0, 11.0, 6.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0192108154296875, -0.018624067306518555, -0.01803731918334961, -0.017450571060180664, -0.01686382293701172, -0.016277074813842773, -0.015690326690673828, -0.015103578567504883, -0.014516830444335938, -0.013930082321166992, -0.013343334197998047, -0.012756586074829102, -0.012169837951660156, -0.011583089828491211, -0.010996341705322266, -0.01040959358215332, -0.009822845458984375, -0.00923609733581543, -0.008649349212646484, -0.008062601089477539, -0.007475852966308594, -0.0068891048431396484, -0.006302356719970703, -0.005715608596801758, -0.0051288604736328125, -0.004542112350463867, -0.003955364227294922, -0.0033686161041259766, -0.0027818679809570312, -0.002195119857788086, -0.0016083717346191406, -0.0010216236114501953, -0.00043487548828125, 0.0001518726348876953, 0.0007386207580566406, 0.001325368881225586, 0.0019121170043945312, 0.0024988651275634766, 0.003085613250732422, 0.003672361373901367, 0.0042591094970703125, 0.004845857620239258, 0.005432605743408203, 0.0060193538665771484, 0.006606101989746094, 0.007192850112915039, 0.007779598236083984, 0.00836634635925293, 0.008953094482421875, 0.00953984260559082, 0.010126590728759766, 0.010713338851928711, 0.011300086975097656, 0.011886835098266602, 0.012473583221435547, 0.013060331344604492, 0.013647079467773438, 0.014233827590942383, 0.014820575714111328, 0.015407323837280273, 0.01599407196044922, 0.016580820083618164, 0.01716756820678711, 0.017754316329956055, 0.018341064453125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 9.0, 11.0, 84.0, 157.0, 278.0, 254.0, 150.0, 49.0, 20.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00055880774743855, -0.0005075038061477244, -0.0004561998648568988, -0.0004048959235660732, -0.0003535919822752476, -0.0003022880700882524, -0.0002509841287974268, -0.00019968018750660121, -0.0001483762462157756, -9.707230492495e-05, -4.576837091008201e-05, 5.535563104785979e-06, 5.6839504395611584e-05, 0.00010814343113452196, 0.00015944737242534757, 0.00021075131371617317, 0.0002620552550069988, 0.0003133591962978244, 0.00036466313758865, 0.0004159670788794756, 0.0004672710201703012, 0.0005185749614611268, 0.0005698788445442915, 0.000621182844042778, 0.0006724867271259427, 0.0007237906684167683, 0.0007750946097075939, 0.0008263985509984195, 0.0008777024922892451, 0.0009290063753724098, 0.0009803103748708963, 0.001031614257954061, 0.0010829182574525476, 0.0011342221405357122, 0.0011855261400341988, 0.0012368300231173635, 0.00128813402261585, 0.0013394379056990147, 0.0013907419051975012, 0.0014420457882806659, 0.0014933497877791524, 0.001544653670862317, 0.0015959576703608036, 0.0016472615534439683, 0.0016985655529424548, 0.0017498694360256195, 0.001801173435524106, 0.0018524773186072707, 0.0019037812016904354, 0.001955085201188922, 0.002006388967856765, 0.0020576929673552513, 0.002108996966853738, 0.0021603009663522243, 0.002211604733020067, 0.0022629087325185537, 0.0023142127320170403, 0.0023655167315155268, 0.0024168204981833696, 0.002468124497681856, 0.0025194284971803427, 0.002570732496678829, 0.002622036263346672, 0.0026733402628451586, 0.002724644262343645]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 7.0, 8.0, 9.0, 9.0, 13.0, 10.0, 11.0, 16.0, 19.0, 29.0, 21.0, 28.0, 31.0, 34.0, 27.0, 26.0, 35.0, 35.0, 44.0, 49.0, 48.0, 38.0, 35.0, 38.0, 33.0, 27.0, 34.0, 28.0, 26.0, 27.0, 36.0, 25.0, 16.0, 11.0, 25.0, 13.0, 14.0, 11.0, 9.0, 6.0, 4.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00040781497955322266, -0.0003941114991903305, -0.00038040801882743835, -0.0003667045384645462, -0.00035300105810165405, -0.0003392975777387619, -0.00032559409737586975, -0.0003118906170129776, -0.00029818713665008545, -0.0002844836562871933, -0.00027078017592430115, -0.000257076695561409, -0.00024337321519851685, -0.0002296697348356247, -0.00021596625447273254, -0.0002022627741098404, -0.00018855929374694824, -0.0001748558133840561, -0.00016115233302116394, -0.0001474488526582718, -0.00013374537229537964, -0.00012004189193248749, -0.00010633841156959534, -9.263493120670319e-05, -7.893145084381104e-05, -6.522797048091888e-05, -5.1524490118026733e-05, -3.782100975513458e-05, -2.411752939224243e-05, -1.041404902935028e-05, 3.28943133354187e-06, 1.699291169643402e-05, 3.069639205932617e-05, 4.439987242221832e-05, 5.8103352785110474e-05, 7.180683314800262e-05, 8.551031351089478e-05, 9.921379387378693e-05, 0.00011291727423667908, 0.00012662075459957123, 0.00014032423496246338, 0.00015402771532535553, 0.00016773119568824768, 0.00018143467605113983, 0.00019513815641403198, 0.00020884163677692413, 0.00022254511713981628, 0.00023624859750270844, 0.0002499520778656006, 0.00026365555822849274, 0.0002773590385913849, 0.00029106251895427704, 0.0003047659993171692, 0.00031846947968006134, 0.0003321729600429535, 0.00034587644040584564, 0.0003595799207687378, 0.00037328340113162994, 0.0003869868814945221, 0.00040069036185741425, 0.0004143938422203064, 0.00042809732258319855, 0.0004418008029460907, 0.00045550428330898285, 0.000469207763671875]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 4.0, 8.0, 8.0, 12.0, 10.0, 15.0, 14.0, 20.0, 22.0, 29.0, 26.0, 32.0, 44.0, 48.0, 52.0, 54.0, 56.0, 47.0, 46.0, 56.0, 49.0, 29.0, 46.0, 45.0, 34.0, 29.0, 21.0, 20.0, 23.0, 19.0, 15.0, 9.0, 16.0, 9.0, 13.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.75390625, -4.6187744140625, -4.483642578125, -4.3485107421875, -4.21337890625, -4.0782470703125, -3.943115234375, -3.8079833984375, -3.6728515625, -3.5377197265625, -3.402587890625, -3.2674560546875, -3.13232421875, -2.9971923828125, -2.862060546875, -2.7269287109375, -2.591796875, -2.4566650390625, -2.321533203125, -2.1864013671875, -2.05126953125, -1.9161376953125, -1.781005859375, -1.6458740234375, -1.5107421875, -1.3756103515625, -1.240478515625, -1.1053466796875, -0.97021484375, -0.8350830078125, -0.699951171875, -0.5648193359375, -0.4296875, -0.2945556640625, -0.159423828125, -0.0242919921875, 0.11083984375, 0.2459716796875, 0.381103515625, 0.5162353515625, 0.6513671875, 0.7864990234375, 0.921630859375, 1.0567626953125, 1.19189453125, 1.3270263671875, 1.462158203125, 1.5972900390625, 1.732421875, 1.8675537109375, 2.002685546875, 2.1378173828125, 2.27294921875, 2.4080810546875, 2.543212890625, 2.6783447265625, 2.8134765625, 2.9486083984375, 3.083740234375, 3.2188720703125, 3.35400390625, 3.4891357421875, 3.624267578125, 3.7593994140625, 3.89453125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 7.0, 10.0, 14.0, 23.0, 28.0, 31.0, 43.0, 82.0, 110.0, 170.0, 270.0, 347.0, 619.0, 1038.0, 1755.0, 2781.0, 5004.0, 9307.0, 19715.0, 52129.0, 175957.0, 482648.0, 196299.0, 56438.0, 21064.0, 9692.0, 5298.0, 2993.0, 1773.0, 1028.0, 640.0, 437.0, 230.0, 176.0, 115.0, 77.0, 60.0, 38.0, 36.0, 19.0, 15.0, 9.0, 4.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.93450927734375, -4.7674560546875, -4.60040283203125, -4.433349609375, -4.26629638671875, -4.0992431640625, -3.93218994140625, -3.76513671875, -3.59808349609375, -3.4310302734375, -3.26397705078125, -3.096923828125, -2.92987060546875, -2.7628173828125, -2.59576416015625, -2.4287109375, -2.26165771484375, -2.0946044921875, -1.92755126953125, -1.760498046875, -1.59344482421875, -1.4263916015625, -1.25933837890625, -1.09228515625, -0.92523193359375, -0.7581787109375, -0.59112548828125, -0.424072265625, -0.25701904296875, -0.0899658203125, 0.07708740234375, 0.244140625, 0.41119384765625, 0.5782470703125, 0.74530029296875, 0.912353515625, 1.07940673828125, 1.2464599609375, 1.41351318359375, 1.58056640625, 1.74761962890625, 1.9146728515625, 2.08172607421875, 2.248779296875, 2.41583251953125, 2.5828857421875, 2.74993896484375, 2.9169921875, 3.08404541015625, 3.2510986328125, 3.41815185546875, 3.585205078125, 3.75225830078125, 3.9193115234375, 4.08636474609375, 4.25341796875, 4.42047119140625, 4.5875244140625, 4.75457763671875, 4.921630859375, 5.08868408203125, 5.2557373046875, 5.42279052734375, 5.58984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 4.0, 4.0, 1.0, 4.0, 4.0, 7.0, 6.0, 7.0, 15.0, 9.0, 14.0, 16.0, 29.0, 28.0, 30.0, 24.0, 35.0, 35.0, 39.0, 39.0, 41.0, 59.0, 117.0, 241.0, 1483.0, 236.0, 104.0, 60.0, 44.0, 44.0, 33.0, 36.0, 24.0, 25.0, 17.0, 22.0, 22.0, 16.0, 10.0, 13.0, 9.0, 6.0, 11.0, 10.0, 3.0, 5.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -12.0352783203125, -11.640869140625, -11.2464599609375, -10.85205078125, -10.4576416015625, -10.063232421875, -9.6688232421875, -9.2744140625, -8.8800048828125, -8.485595703125, -8.0911865234375, -7.69677734375, -7.3023681640625, -6.907958984375, -6.5135498046875, -6.119140625, -5.7247314453125, -5.330322265625, -4.9359130859375, -4.54150390625, -4.1470947265625, -3.752685546875, -3.3582763671875, -2.9638671875, -2.5694580078125, -2.175048828125, -1.7806396484375, -1.38623046875, -0.9918212890625, -0.597412109375, -0.2030029296875, 0.19140625, 0.5858154296875, 0.980224609375, 1.3746337890625, 1.76904296875, 2.1634521484375, 2.557861328125, 2.9522705078125, 3.3466796875, 3.7410888671875, 4.135498046875, 4.5299072265625, 4.92431640625, 5.3187255859375, 5.713134765625, 6.1075439453125, 6.501953125, 6.8963623046875, 7.290771484375, 7.6851806640625, 8.07958984375, 8.4739990234375, 8.868408203125, 9.2628173828125, 9.6572265625, 10.0516357421875, 10.446044921875, 10.8404541015625, 11.23486328125, 11.6292724609375, 12.023681640625, 12.4180908203125, 12.8125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 13.0, 11.0, 21.0, 29.0, 42.0, 84.0, 88.0, 187.0, 370.0, 1097.0, 21871.0, 3080128.0, 39310.0, 1415.0, 424.0, 224.0, 105.0, 91.0, 53.0, 23.0, 32.0, 22.0, 11.0, 10.0, 10.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.33642578125, -39.0166015625, -37.69677734375, -36.376953125, -35.05712890625, -33.7373046875, -32.41748046875, -31.09765625, -29.77783203125, -28.4580078125, -27.13818359375, -25.818359375, -24.49853515625, -23.1787109375, -21.85888671875, -20.5390625, -19.21923828125, -17.8994140625, -16.57958984375, -15.259765625, -13.93994140625, -12.6201171875, -11.30029296875, -9.98046875, -8.66064453125, -7.3408203125, -6.02099609375, -4.701171875, -3.38134765625, -2.0615234375, -0.74169921875, 0.578125, 1.89794921875, 3.2177734375, 4.53759765625, 5.857421875, 7.17724609375, 8.4970703125, 9.81689453125, 11.13671875, 12.45654296875, 13.7763671875, 15.09619140625, 16.416015625, 17.73583984375, 19.0556640625, 20.37548828125, 21.6953125, 23.01513671875, 24.3349609375, 25.65478515625, 26.974609375, 28.29443359375, 29.6142578125, 30.93408203125, 32.25390625, 33.57373046875, 34.8935546875, 36.21337890625, 37.533203125, 38.85302734375, 40.1728515625, 41.49267578125, 42.8125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 34.0, 203.0, 483.0, 249.0, 38.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.999847412109375, -27.16200828552246, -24.32417106628418, -21.486331939697266, -18.648494720458984, -15.81065559387207, -12.972816467285156, -10.134979248046875, -7.297140121459961, -4.459301948547363, -1.6214632987976074, 1.2163753509521484, 4.054213523864746, 6.892051696777344, 9.729890823364258, 12.567728042602539, 15.405567169189453, 18.243406295776367, 21.08124351501465, 23.919082641601562, 26.756919860839844, 29.594758987426758, 32.43259811401367, 35.27043533325195, 38.1082763671875, 40.94611358642578, 43.78395462036133, 46.62179183959961, 49.45962905883789, 52.29747009277344, 55.13530731201172, 57.97314453125, 60.81098175048828, 63.64881896972656, 66.48665618896484, 69.32449340820312, 72.16233825683594, 75.00017547607422, 77.8380126953125, 80.67584991455078, 83.51368713378906, 86.35152435302734, 89.18936157226562, 92.02720642089844, 94.86504364013672, 97.702880859375, 100.54071807861328, 103.37855529785156, 106.21640014648438, 109.05423736572266, 111.89207458496094, 114.72991943359375, 117.56775665283203, 120.40559387207031, 123.2434310913086, 126.08126831054688, 128.91909790039062, 131.75694274902344, 134.5947723388672, 137.4326171875, 140.27044677734375, 143.10829162597656, 145.94613647460938, 148.78396606445312, 151.62181091308594]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 5.0, 5.0, 8.0, 8.0, 18.0, 17.0, 25.0, 29.0, 32.0, 22.0, 25.0, 30.0, 35.0, 45.0, 32.0, 40.0, 50.0, 51.0, 48.0, 38.0, 49.0, 35.0, 36.0, 45.0, 28.0, 27.0, 27.0, 32.0, 24.0, 18.0, 12.0, 17.0, 14.0, 16.0, 5.0, 15.0, 6.0, 11.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.61349105834961, -39.28224563598633, -37.95100021362305, -36.619754791259766, -35.28851318359375, -33.95726776123047, -32.62602233886719, -31.294776916503906, -29.963531494140625, -28.632286071777344, -27.301040649414062, -25.969797134399414, -24.638551712036133, -23.30730628967285, -21.976062774658203, -20.644817352294922, -19.31357192993164, -17.98232650756836, -16.651081085205078, -15.31983757019043, -13.988592147827148, -12.657346725463867, -11.326102256774902, -9.994857788085938, -8.663612365722656, -7.332367420196533, -6.00112247467041, -4.669877529144287, -3.338632583618164, -2.007387638092041, -0.676142692565918, 0.6551017761230469, 1.9863471984863281, 3.317592144012451, 4.648837089538574, 5.980082035064697, 7.31132698059082, 8.642572402954102, 9.973816871643066, 11.305061340332031, 12.636306762695312, 13.967552185058594, 15.298796653747559, 16.630041122436523, 17.961286544799805, 19.292531967163086, 20.623775482177734, 21.955020904541016, 23.286266326904297, 24.617511749267578, 25.94875717163086, 27.280000686645508, 28.61124610900879, 29.94249153137207, 31.27373504638672, 32.60498046875, 33.93622589111328, 35.26747131347656, 36.598716735839844, 37.929962158203125, 39.261207580566406, 40.59244918823242, 41.9236946105957, 43.254940032958984, 44.586185455322266]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 13.0, 14.0, 10.0, 14.0, 8.0, 18.0, 23.0, 28.0, 29.0, 27.0, 43.0, 42.0, 40.0, 48.0, 58.0, 48.0, 65.0, 52.0, 39.0, 33.0, 43.0, 35.0, 36.0, 31.0, 35.0, 21.0, 28.0, 15.0, 7.0, 16.0, 15.0, 11.0, 11.0, 7.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.95703125, -4.821258544921875, -4.68548583984375, -4.549713134765625, -4.4139404296875, -4.278167724609375, -4.14239501953125, -4.006622314453125, -3.870849609375, -3.735076904296875, -3.59930419921875, -3.463531494140625, -3.3277587890625, -3.191986083984375, -3.05621337890625, -2.920440673828125, -2.78466796875, -2.648895263671875, -2.51312255859375, -2.377349853515625, -2.2415771484375, -2.105804443359375, -1.97003173828125, -1.834259033203125, -1.698486328125, -1.562713623046875, -1.42694091796875, -1.291168212890625, -1.1553955078125, -1.019622802734375, -0.88385009765625, -0.748077392578125, -0.6123046875, -0.476531982421875, -0.34075927734375, -0.204986572265625, -0.0692138671875, 0.066558837890625, 0.20233154296875, 0.338104248046875, 0.473876953125, 0.609649658203125, 0.74542236328125, 0.881195068359375, 1.0169677734375, 1.152740478515625, 1.28851318359375, 1.424285888671875, 1.56005859375, 1.695831298828125, 1.83160400390625, 1.967376708984375, 2.1031494140625, 2.238922119140625, 2.37469482421875, 2.510467529296875, 2.646240234375, 2.782012939453125, 2.91778564453125, 3.053558349609375, 3.1893310546875, 3.325103759765625, 3.46087646484375, 3.596649169921875, 3.732421875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 6.0, 6.0, 6.0, 9.0, 7.0, 15.0, 12.0, 21.0, 29.0, 39.0, 78.0, 109.0, 202.0, 326.0, 494.0, 960.0, 1897.0, 4073.0, 8979.0, 21767.0, 56781.0, 162458.0, 479182.0, 1133850.0, 1328034.0, 642997.0, 224326.0, 77371.0, 28866.0, 11491.0, 4908.0, 2343.0, 1104.0, 586.0, 357.0, 180.0, 147.0, 85.0, 51.0, 38.0, 29.0, 18.0, 9.0, 12.0, 12.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.27734375, -5.122802734375, -4.96826171875, -4.813720703125, -4.6591796875, -4.504638671875, -4.35009765625, -4.195556640625, -4.041015625, -3.886474609375, -3.73193359375, -3.577392578125, -3.4228515625, -3.268310546875, -3.11376953125, -2.959228515625, -2.8046875, -2.650146484375, -2.49560546875, -2.341064453125, -2.1865234375, -2.031982421875, -1.87744140625, -1.722900390625, -1.568359375, -1.413818359375, -1.25927734375, -1.104736328125, -0.9501953125, -0.795654296875, -0.64111328125, -0.486572265625, -0.33203125, -0.177490234375, -0.02294921875, 0.131591796875, 0.2861328125, 0.440673828125, 0.59521484375, 0.749755859375, 0.904296875, 1.058837890625, 1.21337890625, 1.367919921875, 1.5224609375, 1.677001953125, 1.83154296875, 1.986083984375, 2.140625, 2.295166015625, 2.44970703125, 2.604248046875, 2.7587890625, 2.913330078125, 3.06787109375, 3.222412109375, 3.376953125, 3.531494140625, 3.68603515625, 3.840576171875, 3.9951171875, 4.149658203125, 4.30419921875, 4.458740234375, 4.61328125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 2.0, 3.0, 14.0, 16.0, 14.0, 24.0, 35.0, 43.0, 85.0, 119.0, 188.0, 271.0, 336.0, 429.0, 527.0, 480.0, 418.0, 317.0, 218.0, 156.0, 134.0, 76.0, 59.0, 36.0, 27.0, 19.0, 12.0, 10.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.796875, -13.412353515625, -13.02783203125, -12.643310546875, -12.2587890625, -11.874267578125, -11.48974609375, -11.105224609375, -10.720703125, -10.336181640625, -9.95166015625, -9.567138671875, -9.1826171875, -8.798095703125, -8.41357421875, -8.029052734375, -7.64453125, -7.260009765625, -6.87548828125, -6.490966796875, -6.1064453125, -5.721923828125, -5.33740234375, -4.952880859375, -4.568359375, -4.183837890625, -3.79931640625, -3.414794921875, -3.0302734375, -2.645751953125, -2.26123046875, -1.876708984375, -1.4921875, -1.107666015625, -0.72314453125, -0.338623046875, 0.0458984375, 0.430419921875, 0.81494140625, 1.199462890625, 1.583984375, 1.968505859375, 2.35302734375, 2.737548828125, 3.1220703125, 3.506591796875, 3.89111328125, 4.275634765625, 4.66015625, 5.044677734375, 5.42919921875, 5.813720703125, 6.1982421875, 6.582763671875, 6.96728515625, 7.351806640625, 7.736328125, 8.120849609375, 8.50537109375, 8.889892578125, 9.2744140625, 9.658935546875, 10.04345703125, 10.427978515625, 10.8125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 3.0, 8.0, 11.0, 12.0, 20.0, 31.0, 50.0, 85.0, 100.0, 189.0, 409.0, 910.0, 3111.0, 17972.0, 183782.0, 2107792.0, 1719529.0, 141299.0, 14619.0, 2642.0, 831.0, 351.0, 175.0, 97.0, 74.0, 48.0, 47.0, 22.0, 19.0, 14.0, 6.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.53515625, -12.9453125, -12.35546875, -11.765625, -11.17578125, -10.5859375, -9.99609375, -9.40625, -8.81640625, -8.2265625, -7.63671875, -7.046875, -6.45703125, -5.8671875, -5.27734375, -4.6875, -4.09765625, -3.5078125, -2.91796875, -2.328125, -1.73828125, -1.1484375, -0.55859375, 0.03125, 0.62109375, 1.2109375, 1.80078125, 2.390625, 2.98046875, 3.5703125, 4.16015625, 4.75, 5.33984375, 5.9296875, 6.51953125, 7.109375, 7.69921875, 8.2890625, 8.87890625, 9.46875, 10.05859375, 10.6484375, 11.23828125, 11.828125, 12.41796875, 13.0078125, 13.59765625, 14.1875, 14.77734375, 15.3671875, 15.95703125, 16.546875, 17.13671875, 17.7265625, 18.31640625, 18.90625, 19.49609375, 20.0859375, 20.67578125, 21.265625, 21.85546875, 22.4453125, 23.03515625, 23.625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 20.0, 34.0, 69.0, 173.0, 202.0, 202.0, 143.0, 91.0, 48.0, 14.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.42080688476562, -139.45489501953125, -136.48898315429688, -133.52308654785156, -130.5571746826172, -127.59126281738281, -124.62535095214844, -121.6594467163086, -118.69354248046875, -115.72763061523438, -112.76172637939453, -109.79581451416016, -106.82991027832031, -103.86399841308594, -100.89808654785156, -97.93218231201172, -94.96627044677734, -92.00035858154297, -89.03445434570312, -86.06854248046875, -83.1026382446289, -80.13672637939453, -77.17082214355469, -74.20491027832031, -71.23899841308594, -68.27308654785156, -65.30718231201172, -62.341270446777344, -59.3753662109375, -56.409454345703125, -53.443546295166016, -50.477638244628906, -47.51172637939453, -44.54581832885742, -41.57991027832031, -38.61399841308594, -35.648094177246094, -32.68218231201172, -29.71627426147461, -26.7503662109375, -23.78445816040039, -20.81855010986328, -17.852642059326172, -14.88673210144043, -11.92082405090332, -8.954916000366211, -5.989006042480469, -3.0230979919433594, -0.05718994140625, 2.9087185859680176, 5.874627113342285, 8.840536117553711, 11.80644416809082, 14.77235221862793, 17.738262176513672, 20.70417022705078, 23.67007827758789, 26.635986328125, 29.60189437866211, 32.56780242919922, 35.533714294433594, 38.49961853027344, 41.46553039550781, 44.43143844604492, 47.39734649658203]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 9.0, 4.0, 8.0, 5.0, 13.0, 11.0, 10.0, 18.0, 17.0, 11.0, 26.0, 16.0, 26.0, 32.0, 37.0, 32.0, 37.0, 26.0, 36.0, 34.0, 47.0, 41.0, 42.0, 34.0, 39.0, 41.0, 40.0, 34.0, 36.0, 26.0, 25.0, 30.0, 21.0, 23.0, 20.0, 13.0, 16.0, 14.0, 11.0, 7.0, 9.0, 6.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-35.398033142089844, -34.387638092041016, -33.37724685668945, -32.366851806640625, -31.35645866394043, -30.346065521240234, -29.335670471191406, -28.32527732849121, -27.314884185791016, -26.30449104309082, -25.294095993041992, -24.283702850341797, -23.2733097076416, -22.262916564941406, -21.252521514892578, -20.242128372192383, -19.231733322143555, -18.22134017944336, -17.21094512939453, -16.200551986694336, -15.19015884399414, -14.179764747619629, -13.169370651245117, -12.158977508544922, -11.14858341217041, -10.138189315795898, -9.127796173095703, -8.117402076721191, -7.107008457183838, -6.096614837646484, -5.086220741271973, -4.075827121734619, -3.065431594848633, -2.0550379753112793, -1.0446441173553467, -0.03425025939941406, 0.9761433601379395, 1.986536979675293, 2.9969310760498047, 4.007324695587158, 5.017718315124512, 6.028111934661865, 7.038505554199219, 8.04889965057373, 9.059293746948242, 10.069686889648438, 11.08008098602295, 12.090475082397461, 13.100868225097656, 14.111262321472168, 15.121655464172363, 16.132049560546875, 17.14244270324707, 18.152835845947266, 19.163230895996094, 20.17362403869629, 21.184017181396484, 22.19441032409668, 23.204805374145508, 24.215198516845703, 25.2255916595459, 26.235984802246094, 27.246379852294922, 28.256772994995117, 29.267168045043945]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 4.0, 6.0, 8.0, 9.0, 9.0, 7.0, 12.0, 19.0, 18.0, 28.0, 21.0, 27.0, 32.0, 45.0, 52.0, 55.0, 44.0, 61.0, 53.0, 35.0, 46.0, 50.0, 44.0, 44.0, 37.0, 34.0, 26.0, 26.0, 34.0, 20.0, 18.0, 16.0, 17.0, 8.0, 11.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91796875, -4.76983642578125, -4.6217041015625, -4.47357177734375, -4.325439453125, -4.17730712890625, -4.0291748046875, -3.88104248046875, -3.73291015625, -3.58477783203125, -3.4366455078125, -3.28851318359375, -3.140380859375, -2.99224853515625, -2.8441162109375, -2.69598388671875, -2.5478515625, -2.39971923828125, -2.2515869140625, -2.10345458984375, -1.955322265625, -1.80718994140625, -1.6590576171875, -1.51092529296875, -1.36279296875, -1.21466064453125, -1.0665283203125, -0.91839599609375, -0.770263671875, -0.62213134765625, -0.4739990234375, -0.32586669921875, -0.177734375, -0.02960205078125, 0.1185302734375, 0.26666259765625, 0.414794921875, 0.56292724609375, 0.7110595703125, 0.85919189453125, 1.00732421875, 1.15545654296875, 1.3035888671875, 1.45172119140625, 1.599853515625, 1.74798583984375, 1.8961181640625, 2.04425048828125, 2.1923828125, 2.34051513671875, 2.4886474609375, 2.63677978515625, 2.784912109375, 2.93304443359375, 3.0811767578125, 3.22930908203125, 3.37744140625, 3.52557373046875, 3.6737060546875, 3.82183837890625, 3.969970703125, 4.11810302734375, 4.2662353515625, 4.41436767578125, 4.5625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 6.0, 19.0, 30.0, 27.0, 40.0, 98.0, 134.0, 179.0, 297.0, 352.0, 565.0, 852.0, 1328.0, 1994.0, 3006.0, 4775.0, 7013.0, 10985.0, 16761.0, 25519.0, 39749.0, 61459.0, 95757.0, 145301.0, 188228.0, 154372.0, 102282.0, 65464.0, 42605.0, 27700.0, 17924.0, 11650.0, 7446.0, 4963.0, 3210.0, 2096.0, 1437.0, 962.0, 611.0, 457.0, 314.0, 177.0, 130.0, 88.0, 51.0, 41.0, 27.0, 25.0, 16.0, 9.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.322998046875, -0.3130836486816406, -0.30316925048828125, -0.2932548522949219, -0.2833404541015625, -0.2734260559082031, -0.26351165771484375, -0.2535972595214844, -0.243682861328125, -0.23376846313476562, -0.22385406494140625, -0.21393966674804688, -0.2040252685546875, -0.19411087036132812, -0.18419647216796875, -0.17428207397460938, -0.16436767578125, -0.15445327758789062, -0.14453887939453125, -0.13462448120117188, -0.1247100830078125, -0.11479568481445312, -0.10488128662109375, -0.09496688842773438, -0.085052490234375, -0.07513809204101562, -0.06522369384765625, -0.055309295654296875, -0.0453948974609375, -0.035480499267578125, -0.02556610107421875, -0.015651702880859375, -0.0057373046875, 0.004177093505859375, 0.01409149169921875, 0.024005889892578125, 0.0339202880859375, 0.043834686279296875, 0.05374908447265625, 0.06366348266601562, 0.073577880859375, 0.08349227905273438, 0.09340667724609375, 0.10332107543945312, 0.1132354736328125, 0.12314987182617188, 0.13306427001953125, 0.14297866821289062, 0.15289306640625, 0.16280746459960938, 0.17272186279296875, 0.18263626098632812, 0.1925506591796875, 0.20246505737304688, 0.21237945556640625, 0.22229385375976562, 0.232208251953125, 0.24212265014648438, 0.25203704833984375, 0.2619514465332031, 0.2718658447265625, 0.2817802429199219, 0.29169464111328125, 0.3016090393066406, 0.3115234375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 3.0, 3.0, 1.0, 5.0, 2.0, 13.0, 4.0, 8.0, 8.0, 21.0, 14.0, 15.0, 22.0, 14.0, 20.0, 24.0, 29.0, 32.0, 32.0, 24.0, 33.0, 31.0, 42.0, 37.0, 30.0, 1052.0, 33.0, 35.0, 37.0, 30.0, 36.0, 39.0, 30.0, 36.0, 32.0, 29.0, 25.0, 20.0, 22.0, 13.0, 20.0, 11.0, 12.0, 4.0, 10.0, 12.0, 9.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0859375, -2.01300048828125, -1.9400634765625, -1.86712646484375, -1.794189453125, -1.72125244140625, -1.6483154296875, -1.57537841796875, -1.50244140625, -1.42950439453125, -1.3565673828125, -1.28363037109375, -1.210693359375, -1.13775634765625, -1.0648193359375, -0.99188232421875, -0.9189453125, -0.84600830078125, -0.7730712890625, -0.70013427734375, -0.627197265625, -0.55426025390625, -0.4813232421875, -0.40838623046875, -0.33544921875, -0.26251220703125, -0.1895751953125, -0.11663818359375, -0.043701171875, 0.02923583984375, 0.1021728515625, 0.17510986328125, 0.248046875, 0.32098388671875, 0.3939208984375, 0.46685791015625, 0.539794921875, 0.61273193359375, 0.6856689453125, 0.75860595703125, 0.83154296875, 0.90447998046875, 0.9774169921875, 1.05035400390625, 1.123291015625, 1.19622802734375, 1.2691650390625, 1.34210205078125, 1.4150390625, 1.48797607421875, 1.5609130859375, 1.63385009765625, 1.706787109375, 1.77972412109375, 1.8526611328125, 1.92559814453125, 1.99853515625, 2.07147216796875, 2.1444091796875, 2.21734619140625, 2.290283203125, 2.36322021484375, 2.4361572265625, 2.50909423828125, 2.58203125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 11.0, 7.0, 18.0, 15.0, 38.0, 67.0, 97.0, 172.0, 266.0, 458.0, 678.0, 1228.0, 2072.0, 3382.0, 5683.0, 9084.0, 14783.0, 24079.0, 39760.0, 63939.0, 102794.0, 157470.0, 1243385.0, 157992.0, 103248.0, 64586.0, 39316.0, 24139.0, 14876.0, 9296.0, 5633.0, 3398.0, 2110.0, 1242.0, 690.0, 419.0, 274.0, 168.0, 103.0, 55.0, 33.0, 29.0, 16.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269775390625, -0.2606315612792969, -0.25148773193359375, -0.24234390258789062, -0.2332000732421875, -0.22405624389648438, -0.21491241455078125, -0.20576858520507812, -0.196624755859375, -0.18748092651367188, -0.17833709716796875, -0.16919326782226562, -0.1600494384765625, -0.15090560913085938, -0.14176177978515625, -0.13261795043945312, -0.12347412109375, -0.11433029174804688, -0.10518646240234375, -0.09604263305664062, -0.0868988037109375, -0.07775497436523438, -0.06861114501953125, -0.059467315673828125, -0.050323486328125, -0.041179656982421875, -0.03203582763671875, -0.022891998291015625, -0.0137481689453125, -0.004604339599609375, 0.00453948974609375, 0.013683319091796875, 0.0228271484375, 0.031970977783203125, 0.04111480712890625, 0.050258636474609375, 0.0594024658203125, 0.06854629516601562, 0.07769012451171875, 0.08683395385742188, 0.095977783203125, 0.10512161254882812, 0.11426544189453125, 0.12340927124023438, 0.1325531005859375, 0.14169692993164062, 0.15084075927734375, 0.15998458862304688, 0.16912841796875, 0.17827224731445312, 0.18741607666015625, 0.19655990600585938, 0.2057037353515625, 0.21484756469726562, 0.22399139404296875, 0.23313522338867188, 0.242279052734375, 0.2514228820800781, 0.26056671142578125, 0.2697105407714844, 0.2788543701171875, 0.2879981994628906, 0.29714202880859375, 0.3062858581542969, 0.3154296875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 3.0, 7.0, 12.0, 23.0, 28.0, 26.0, 40.0, 37.0, 67.0, 50.0, 69.0, 75.0, 79.0, 75.0, 88.0, 60.0, 55.0, 47.0, 34.0, 25.0, 28.0, 13.0, 14.0, 9.0, 9.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0014410018920898438, -0.0014044567942619324, -0.001367911696434021, -0.0013313665986061096, -0.0012948215007781982, -0.0012582764029502869, -0.0012217313051223755, -0.0011851862072944641, -0.0011486411094665527, -0.0011120960116386414, -0.00107555091381073, -0.0010390058159828186, -0.0010024607181549072, -0.0009659156203269958, -0.0009293705224990845, -0.0008928254246711731, -0.0008562803268432617, -0.0008197352290153503, -0.000783190131187439, -0.0007466450333595276, -0.0007100999355316162, -0.0006735548377037048, -0.0006370097398757935, -0.0006004646420478821, -0.0005639195442199707, -0.0005273744463920593, -0.000490829348564148, -0.00045428425073623657, -0.0004177391529083252, -0.0003811940550804138, -0.00034464895725250244, -0.00030810385942459106, -0.0002715587615966797, -0.0002350136637687683, -0.00019846856594085693, -0.00016192346811294556, -0.00012537837028503418, -8.88332724571228e-05, -5.2288174629211426e-05, -1.574307680130005e-05, 2.0802021026611328e-05, 5.7347118854522705e-05, 9.389221668243408e-05, 0.00013043731451034546, 0.00016698241233825684, 0.0002035275101661682, 0.0002400726079940796, 0.00027661770582199097, 0.00031316280364990234, 0.0003497079014778137, 0.0003862529993057251, 0.0004227980971336365, 0.00045934319496154785, 0.0004958882927894592, 0.0005324333906173706, 0.000568978488445282, 0.0006055235862731934, 0.0006420686841011047, 0.0006786137819290161, 0.0007151588797569275, 0.0007517039775848389, 0.0007882490754127502, 0.0008247941732406616, 0.000861339271068573, 0.0008978843688964844]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 7.0, 5.0, 11.0, 10.0, 11.0, 23.0, 33.0, 39.0, 59.0, 105.0, 135.0, 232.0, 387.0, 849.0, 19140.0, 1009116.0, 16534.0, 816.0, 376.0, 220.0, 146.0, 86.0, 60.0, 49.0, 27.0, 20.0, 10.0, 11.0, 5.0, 8.0, 4.0, 4.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01535797119140625, -0.01473081111907959, -0.01410365104675293, -0.01347649097442627, -0.01284933090209961, -0.01222217082977295, -0.011595010757446289, -0.010967850685119629, -0.010340690612792969, -0.009713530540466309, -0.009086370468139648, -0.008459210395812988, -0.007832050323486328, -0.007204890251159668, -0.006577730178833008, -0.005950570106506348, -0.0053234100341796875, -0.004696249961853027, -0.004069089889526367, -0.003441929817199707, -0.002814769744873047, -0.0021876096725463867, -0.0015604496002197266, -0.0009332895278930664, -0.00030612945556640625, 0.0003210306167602539, 0.0009481906890869141, 0.0015753507614135742, 0.0022025108337402344, 0.0028296709060668945, 0.0034568309783935547, 0.004083991050720215, 0.004711151123046875, 0.005338311195373535, 0.005965471267700195, 0.0065926313400268555, 0.007219791412353516, 0.007846951484680176, 0.008474111557006836, 0.009101271629333496, 0.009728431701660156, 0.010355591773986816, 0.010982751846313477, 0.011609911918640137, 0.012237071990966797, 0.012864232063293457, 0.013491392135620117, 0.014118552207946777, 0.014745712280273438, 0.015372872352600098, 0.016000032424926758, 0.016627192497253418, 0.017254352569580078, 0.01788151264190674, 0.0185086727142334, 0.01913583278656006, 0.01976299285888672, 0.02039015293121338, 0.02101731300354004, 0.0216444730758667, 0.02227163314819336, 0.02289879322052002, 0.02352595329284668, 0.02415311336517334, 0.0247802734375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 110.0, 490.0, 368.0, 39.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004035771358758211, -0.0039128875359892845, -0.0037900032475590706, -0.0036671191919595003, -0.00354423513635993, -0.0034213513135910034, -0.003298467257991433, -0.003175583202391863, -0.0030526991467922926, -0.0029298150911927223, -0.002806931035593152, -0.0026840469799935818, -0.002561163157224655, -0.0024382788687944412, -0.0023153950460255146, -0.0021925109904259443, -0.002069626934826374, -0.0019467428792268038, -0.0018238588236272335, -0.001700974884442985, -0.0015780908288434148, -0.0014552067732438445, -0.001332322834059596, -0.0012094387784600258, -0.0010865547228604555, -0.0009636706672608852, -0.0008407866698689759, -0.0007179026724770665, -0.0005950186168774962, -0.00047213456127792597, -0.0003492505638860166, -0.00022636656649410725, -0.00010348204523324966, 1.9401981262490153e-05, 0.00014228600775822997, 0.0002651700342539698, 0.0003880540607497096, 0.0005109381163492799, 0.0006338221137411892, 0.0007567061111330986, 0.0008795901667326689, 0.0010024742223322392, 0.0011253582779318094, 0.0012482422171160579, 0.0013711262727156281, 0.0014940103283151984, 0.0016168942674994469, 0.0017397783230990171, 0.0018626623786985874, 0.0019855464342981577, 0.002108430489897728, 0.0022313145454972982, 0.0023541986010968685, 0.002477082423865795, 0.0025999664794653654, 0.0027228505350649357, 0.002845734590664506, 0.0029686186462640762, 0.0030915027018636465, 0.0032143867574632168, 0.0033372705802321434, 0.0034601548686623573, 0.003583038691431284, 0.0037059227470308542, 0.0038288068026304245]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 3.0, 5.0, 10.0, 11.0, 16.0, 19.0, 22.0, 23.0, 23.0, 38.0, 25.0, 32.0, 30.0, 31.0, 45.0, 37.0, 45.0, 53.0, 38.0, 51.0, 46.0, 35.0, 57.0, 31.0, 46.0, 38.0, 23.0, 34.0, 19.0, 20.0, 22.0, 22.0, 12.0, 5.0, 10.0, 8.0, 5.0, 5.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005851984024047852, -0.0005677500739693642, -0.0005503017455339432, -0.0005328534170985222, -0.0005154050886631012, -0.0004979567602276802, -0.0004805084317922592, -0.0004630601033568382, -0.00044561177492141724, -0.00042816344648599625, -0.00041071511805057526, -0.00039326678961515427, -0.0003758184611797333, -0.0003583701327443123, -0.0003409218043088913, -0.0003234734758734703, -0.0003060251474380493, -0.0002885768190026283, -0.00027112849056720734, -0.00025368016213178635, -0.00023623183369636536, -0.00021878350526094437, -0.00020133517682552338, -0.0001838868483901024, -0.0001664385199546814, -0.0001489901915192604, -0.00013154186308383942, -0.00011409353464841843, -9.664520621299744e-05, -7.919687777757645e-05, -6.174854934215546e-05, -4.4300220906734467e-05, -2.6851892471313477e-05, -9.403564035892487e-06, 8.044764399528503e-06, 2.5493092834949493e-05, 4.2941421270370483e-05, 6.0389749705791473e-05, 7.783807814121246e-05, 9.528640657663345e-05, 0.00011273473501205444, 0.00013018306344747543, 0.00014763139188289642, 0.0001650797203183174, 0.0001825280487537384, 0.0001999763771891594, 0.00021742470562458038, 0.00023487303406000137, 0.00025232136249542236, 0.00026976969093084335, 0.00028721801936626434, 0.00030466634780168533, 0.0003221146762371063, 0.0003395630046725273, 0.0003570113331079483, 0.0003744596615433693, 0.0003919079899787903, 0.0004093563184142113, 0.00042680464684963226, 0.00044425297528505325, 0.00046170130372047424, 0.00047914963215589523, 0.0004965979605913162, 0.0005140462890267372, 0.0005314946174621582]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 4.0, 6.0, 8.0, 9.0, 9.0, 7.0, 12.0, 19.0, 18.0, 28.0, 21.0, 27.0, 32.0, 45.0, 52.0, 55.0, 44.0, 61.0, 53.0, 35.0, 46.0, 50.0, 45.0, 43.0, 37.0, 34.0, 26.0, 26.0, 34.0, 20.0, 18.0, 16.0, 17.0, 8.0, 11.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91796875, -4.76983642578125, -4.6217041015625, -4.47357177734375, -4.325439453125, -4.17730712890625, -4.0291748046875, -3.88104248046875, -3.73291015625, -3.58477783203125, -3.4366455078125, -3.28851318359375, -3.140380859375, -2.99224853515625, -2.8441162109375, -2.69598388671875, -2.5478515625, -2.39971923828125, -2.2515869140625, -2.10345458984375, -1.955322265625, -1.80718994140625, -1.6590576171875, -1.51092529296875, -1.36279296875, -1.21466064453125, -1.0665283203125, -0.91839599609375, -0.770263671875, -0.62213134765625, -0.4739990234375, -0.32586669921875, -0.177734375, -0.02960205078125, 0.1185302734375, 0.26666259765625, 0.414794921875, 0.56292724609375, 0.7110595703125, 0.85919189453125, 1.00732421875, 1.15545654296875, 1.3035888671875, 1.45172119140625, 1.599853515625, 1.74798583984375, 1.8961181640625, 2.04425048828125, 2.1923828125, 2.34051513671875, 2.4886474609375, 2.63677978515625, 2.784912109375, 2.93304443359375, 3.0811767578125, 3.22930908203125, 3.37744140625, 3.52557373046875, 3.6737060546875, 3.82183837890625, 3.969970703125, 4.11810302734375, 4.2662353515625, 4.41436767578125, 4.5625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 11.0, 5.0, 10.0, 17.0, 18.0, 21.0, 31.0, 38.0, 53.0, 114.0, 145.0, 253.0, 441.0, 806.0, 1551.0, 3030.0, 5876.0, 11714.0, 25022.0, 63039.0, 204481.0, 423538.0, 198432.0, 61572.0, 24628.0, 11459.0, 5871.0, 2882.0, 1502.0, 857.0, 430.0, 251.0, 164.0, 70.0, 70.0, 48.0, 34.0, 18.0, 17.0, 13.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.5625, -4.40234375, -4.2421875, -4.08203125, -3.921875, -3.76171875, -3.6015625, -3.44140625, -3.28125, -3.12109375, -2.9609375, -2.80078125, -2.640625, -2.48046875, -2.3203125, -2.16015625, -2.0, -1.83984375, -1.6796875, -1.51953125, -1.359375, -1.19921875, -1.0390625, -0.87890625, -0.71875, -0.55859375, -0.3984375, -0.23828125, -0.078125, 0.08203125, 0.2421875, 0.40234375, 0.5625, 0.72265625, 0.8828125, 1.04296875, 1.203125, 1.36328125, 1.5234375, 1.68359375, 1.84375, 2.00390625, 2.1640625, 2.32421875, 2.484375, 2.64453125, 2.8046875, 2.96484375, 3.125, 3.28515625, 3.4453125, 3.60546875, 3.765625, 3.92578125, 4.0859375, 4.24609375, 4.40625, 4.56640625, 4.7265625, 4.88671875, 5.046875, 5.20703125, 5.3671875, 5.52734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 2.0, 6.0, 9.0, 13.0, 12.0, 13.0, 20.0, 25.0, 29.0, 34.0, 36.0, 40.0, 48.0, 68.0, 141.0, 251.0, 1511.0, 265.0, 110.0, 73.0, 59.0, 41.0, 27.0, 36.0, 33.0, 29.0, 20.0, 21.0, 17.0, 13.0, 8.0, 8.0, 8.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.75, -19.1932373046875, -18.636474609375, -18.0797119140625, -17.52294921875, -16.9661865234375, -16.409423828125, -15.8526611328125, -15.2958984375, -14.7391357421875, -14.182373046875, -13.6256103515625, -13.06884765625, -12.5120849609375, -11.955322265625, -11.3985595703125, -10.841796875, -10.2850341796875, -9.728271484375, -9.1715087890625, -8.61474609375, -8.0579833984375, -7.501220703125, -6.9444580078125, -6.3876953125, -5.8309326171875, -5.274169921875, -4.7174072265625, -4.16064453125, -3.6038818359375, -3.047119140625, -2.4903564453125, -1.93359375, -1.3768310546875, -0.820068359375, -0.2633056640625, 0.29345703125, 0.8502197265625, 1.406982421875, 1.9637451171875, 2.5205078125, 3.0772705078125, 3.634033203125, 4.1907958984375, 4.74755859375, 5.3043212890625, 5.861083984375, 6.4178466796875, 6.974609375, 7.5313720703125, 8.088134765625, 8.6448974609375, 9.20166015625, 9.7584228515625, 10.315185546875, 10.8719482421875, 11.4287109375, 11.9854736328125, 12.542236328125, 13.0989990234375, 13.65576171875, 14.2125244140625, 14.769287109375, 15.3260498046875, 15.8828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 2.0, 4.0, 6.0, 13.0, 14.0, 16.0, 21.0, 29.0, 36.0, 39.0, 77.0, 112.0, 186.0, 271.0, 562.0, 2331.0, 135086.0, 2992731.0, 12180.0, 952.0, 372.0, 226.0, 116.0, 81.0, 64.0, 49.0, 28.0, 24.0, 19.0, 12.0, 9.0, 9.0, 5.0, 5.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.65625, -39.31298828125, -37.9697265625, -36.62646484375, -35.283203125, -33.93994140625, -32.5966796875, -31.25341796875, -29.91015625, -28.56689453125, -27.2236328125, -25.88037109375, -24.537109375, -23.19384765625, -21.8505859375, -20.50732421875, -19.1640625, -17.82080078125, -16.4775390625, -15.13427734375, -13.791015625, -12.44775390625, -11.1044921875, -9.76123046875, -8.41796875, -7.07470703125, -5.7314453125, -4.38818359375, -3.044921875, -1.70166015625, -0.3583984375, 0.98486328125, 2.328125, 3.67138671875, 5.0146484375, 6.35791015625, 7.701171875, 9.04443359375, 10.3876953125, 11.73095703125, 13.07421875, 14.41748046875, 15.7607421875, 17.10400390625, 18.447265625, 19.79052734375, 21.1337890625, 22.47705078125, 23.8203125, 25.16357421875, 26.5068359375, 27.85009765625, 29.193359375, 30.53662109375, 31.8798828125, 33.22314453125, 34.56640625, 35.90966796875, 37.2529296875, 38.59619140625, 39.939453125, 41.28271484375, 42.6259765625, 43.96923828125, 45.3125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 34.0, 122.0, 303.0, 315.0, 181.0, 45.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.525617599487305, -26.355003356933594, -24.18438720703125, -22.01377296447754, -19.843158721923828, -17.672542572021484, -15.501928329467773, -13.331313133239746, -11.160697937011719, -8.990082740783691, -6.819468021392822, -4.648853302001953, -2.478238105773926, -0.30762290954589844, 1.8629913330078125, 4.03360652923584, 6.204221725463867, 8.374836921691895, 10.545452117919922, 12.716066360473633, 14.88668155670166, 17.057296752929688, 19.2279109954834, 21.39852523803711, 23.569141387939453, 25.739755630493164, 27.910371780395508, 30.08098602294922, 32.25160217285156, 34.422218322753906, 36.592830657958984, 38.76344680786133, 40.93406677246094, 43.10468292236328, 45.27529525756836, 47.4459114074707, 49.61652755737305, 51.787139892578125, 53.95775604248047, 56.12837219238281, 58.298988342285156, 60.4696044921875, 62.64021682739258, 64.81083679199219, 66.9814453125, 69.15206146240234, 71.32267761230469, 73.49329376220703, 75.66390991210938, 77.83452606201172, 80.00514221191406, 82.17575073242188, 84.34636688232422, 86.51698303222656, 88.6875991821289, 90.85821533203125, 93.02882385253906, 95.1994400024414, 97.37005615234375, 99.54066467285156, 101.7112808227539, 103.88189697265625, 106.0525131225586, 108.22312927246094, 110.39374542236328]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 8.0, 12.0, 16.0, 12.0, 14.0, 19.0, 26.0, 18.0, 29.0, 28.0, 36.0, 32.0, 35.0, 38.0, 44.0, 46.0, 39.0, 37.0, 37.0, 47.0, 45.0, 37.0, 42.0, 29.0, 33.0, 30.0, 31.0, 29.0, 25.0, 15.0, 18.0, 13.0, 15.0, 13.0, 12.0, 7.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.598392486572266, -38.39763641357422, -37.19688034057617, -35.99612045288086, -34.79536437988281, -33.594608306884766, -32.39385223388672, -31.193096160888672, -29.992338180541992, -28.791582107543945, -27.590824127197266, -26.39006805419922, -25.189311981201172, -23.988554000854492, -22.787797927856445, -21.587039947509766, -20.38628387451172, -19.185527801513672, -17.984769821166992, -16.784013748168945, -15.583256721496582, -14.382499694824219, -13.181743621826172, -11.980986595153809, -10.780229568481445, -9.579472541809082, -8.378715515136719, -7.177959442138672, -5.977202415466309, -4.776445388793945, -3.5756888389587402, -2.374932289123535, -1.1741714477539062, 0.02658534049987793, 1.227342128753662, 2.4280989170074463, 3.6288557052612305, 4.829612731933594, 6.030369281768799, 7.231125831604004, 8.431882858276367, 9.63263988494873, 10.833396911621094, 12.03415298461914, 13.234910011291504, 14.435667037963867, 15.636423110961914, 16.837181091308594, 18.03793716430664, 19.238693237304688, 20.439451217651367, 21.640207290649414, 22.840965270996094, 24.04172134399414, 25.242477416992188, 26.443233489990234, 27.643991470336914, 28.84474754333496, 30.04550552368164, 31.246261596679688, 32.447017669677734, 33.64777374267578, 34.848533630371094, 36.04928970336914, 37.25004577636719]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 5.0, 11.0, 2.0, 7.0, 18.0, 18.0, 22.0, 40.0, 26.0, 31.0, 41.0, 40.0, 45.0, 52.0, 37.0, 51.0, 67.0, 44.0, 49.0, 42.0, 31.0, 41.0, 47.0, 31.0, 34.0, 22.0, 27.0, 18.0, 20.0, 13.0, 8.0, 15.0, 10.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.17578125, -5.01776123046875, -4.8597412109375, -4.70172119140625, -4.543701171875, -4.38568115234375, -4.2276611328125, -4.06964111328125, -3.91162109375, -3.75360107421875, -3.5955810546875, -3.43756103515625, -3.279541015625, -3.12152099609375, -2.9635009765625, -2.80548095703125, -2.6474609375, -2.48944091796875, -2.3314208984375, -2.17340087890625, -2.015380859375, -1.85736083984375, -1.6993408203125, -1.54132080078125, -1.38330078125, -1.22528076171875, -1.0672607421875, -0.90924072265625, -0.751220703125, -0.59320068359375, -0.4351806640625, -0.27716064453125, -0.119140625, 0.03887939453125, 0.1968994140625, 0.35491943359375, 0.512939453125, 0.67095947265625, 0.8289794921875, 0.98699951171875, 1.14501953125, 1.30303955078125, 1.4610595703125, 1.61907958984375, 1.777099609375, 1.93511962890625, 2.0931396484375, 2.25115966796875, 2.4091796875, 2.56719970703125, 2.7252197265625, 2.88323974609375, 3.041259765625, 3.19927978515625, 3.3572998046875, 3.51531982421875, 3.67333984375, 3.83135986328125, 3.9893798828125, 4.14739990234375, 4.305419921875, 4.46343994140625, 4.6214599609375, 4.77947998046875, 4.9375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 17.0, 13.0, 14.0, 16.0, 26.0, 31.0, 37.0, 54.0, 46.0, 75.0, 109.0, 142.0, 343.0, 1062.0, 9354.0, 375798.0, 3552837.0, 245623.0, 6969.0, 860.0, 264.0, 125.0, 103.0, 63.0, 63.0, 33.0, 38.0, 35.0, 30.0, 22.0, 13.0, 8.0, 11.0, 7.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.4375, -20.796630859375, -20.15576171875, -19.514892578125, -18.8740234375, -18.233154296875, -17.59228515625, -16.951416015625, -16.310546875, -15.669677734375, -15.02880859375, -14.387939453125, -13.7470703125, -13.106201171875, -12.46533203125, -11.824462890625, -11.18359375, -10.542724609375, -9.90185546875, -9.260986328125, -8.6201171875, -7.979248046875, -7.33837890625, -6.697509765625, -6.056640625, -5.415771484375, -4.77490234375, -4.134033203125, -3.4931640625, -2.852294921875, -2.21142578125, -1.570556640625, -0.9296875, -0.288818359375, 0.35205078125, 0.992919921875, 1.6337890625, 2.274658203125, 2.91552734375, 3.556396484375, 4.197265625, 4.838134765625, 5.47900390625, 6.119873046875, 6.7607421875, 7.401611328125, 8.04248046875, 8.683349609375, 9.32421875, 9.965087890625, 10.60595703125, 11.246826171875, 11.8876953125, 12.528564453125, 13.16943359375, 13.810302734375, 14.451171875, 15.092041015625, 15.73291015625, 16.373779296875, 17.0146484375, 17.655517578125, 18.29638671875, 18.937255859375, 19.578125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 7.0, 12.0, 18.0, 26.0, 51.0, 73.0, 128.0, 215.0, 385.0, 580.0, 738.0, 704.0, 430.0, 297.0, 174.0, 109.0, 59.0, 26.0, 16.0, 16.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.765625, -13.185302734375, -12.60498046875, -12.024658203125, -11.4443359375, -10.864013671875, -10.28369140625, -9.703369140625, -9.123046875, -8.542724609375, -7.96240234375, -7.382080078125, -6.8017578125, -6.221435546875, -5.64111328125, -5.060791015625, -4.48046875, -3.900146484375, -3.31982421875, -2.739501953125, -2.1591796875, -1.578857421875, -0.99853515625, -0.418212890625, 0.162109375, 0.742431640625, 1.32275390625, 1.903076171875, 2.4833984375, 3.063720703125, 3.64404296875, 4.224365234375, 4.8046875, 5.385009765625, 5.96533203125, 6.545654296875, 7.1259765625, 7.706298828125, 8.28662109375, 8.866943359375, 9.447265625, 10.027587890625, 10.60791015625, 11.188232421875, 11.7685546875, 12.348876953125, 12.92919921875, 13.509521484375, 14.08984375, 14.670166015625, 15.25048828125, 15.830810546875, 16.4111328125, 16.991455078125, 17.57177734375, 18.152099609375, 18.732421875, 19.312744140625, 19.89306640625, 20.473388671875, 21.0537109375, 21.634033203125, 22.21435546875, 22.794677734375, 23.375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 13.0, 16.0, 27.0, 52.0, 83.0, 193.0, 389.0, 867.0, 8311.0, 2760090.0, 1417664.0, 5061.0, 791.0, 330.0, 169.0, 102.0, 55.0, 21.0, 23.0, 11.0, 2.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-65.4375, -63.8388671875, -62.240234375, -60.6416015625, -59.04296875, -57.4443359375, -55.845703125, -54.2470703125, -52.6484375, -51.0498046875, -49.451171875, -47.8525390625, -46.25390625, -44.6552734375, -43.056640625, -41.4580078125, -39.859375, -38.2607421875, -36.662109375, -35.0634765625, -33.46484375, -31.8662109375, -30.267578125, -28.6689453125, -27.0703125, -25.4716796875, -23.873046875, -22.2744140625, -20.67578125, -19.0771484375, -17.478515625, -15.8798828125, -14.28125, -12.6826171875, -11.083984375, -9.4853515625, -7.88671875, -6.2880859375, -4.689453125, -3.0908203125, -1.4921875, 0.1064453125, 1.705078125, 3.3037109375, 4.90234375, 6.5009765625, 8.099609375, 9.6982421875, 11.296875, 12.8955078125, 14.494140625, 16.0927734375, 17.69140625, 19.2900390625, 20.888671875, 22.4873046875, 24.0859375, 25.6845703125, 27.283203125, 28.8818359375, 30.48046875, 32.0791015625, 33.677734375, 35.2763671875, 36.875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 11.0, 13.0, 23.0, 25.0, 36.0, 50.0, 51.0, 64.0, 60.0, 82.0, 86.0, 70.0, 74.0, 77.0, 63.0, 51.0, 27.0, 33.0, 32.0, 20.0, 12.0, 13.0, 10.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.672157287597656, -34.4562873840332, -33.240421295166016, -32.02455139160156, -30.80868148803711, -29.59281349182129, -28.37694549560547, -27.161075592041016, -25.945207595825195, -24.729339599609375, -23.513469696044922, -22.2976016998291, -21.08173370361328, -19.865863800048828, -18.649995803833008, -17.434127807617188, -16.218257904052734, -15.002388954162598, -13.786520004272461, -12.57065200805664, -11.354783058166504, -10.138914108276367, -8.923046112060547, -7.70717716217041, -6.491308212280273, -5.275439262390137, -4.059570789337158, -2.8437020778656006, -1.627833366394043, -0.41196441650390625, 0.8039040565490723, 2.019772529602051, 3.235645294189453, 4.45151424407959, 5.667382717132568, 6.883251190185547, 8.099120140075684, 9.31498908996582, 10.53085708618164, 11.746726036071777, 12.962594985961914, 14.17846393585205, 15.394332885742188, 16.610200881958008, 17.826068878173828, 19.04193878173828, 20.2578067779541, 21.473674774169922, 22.689544677734375, 23.905412673950195, 25.12128257751465, 26.33715057373047, 27.553020477294922, 28.768888473510742, 29.984756469726562, 31.200626373291016, 32.41649627685547, 33.63236618041992, 34.84823226928711, 36.06410217285156, 37.279972076416016, 38.49584197998047, 39.711708068847656, 40.92757797241211, 42.1434440612793]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 11.0, 9.0, 12.0, 23.0, 14.0, 21.0, 17.0, 27.0, 18.0, 37.0, 33.0, 36.0, 26.0, 34.0, 51.0, 33.0, 46.0, 38.0, 37.0, 43.0, 49.0, 43.0, 28.0, 41.0, 35.0, 31.0, 22.0, 35.0, 23.0, 20.0, 23.0, 12.0, 12.0, 6.0, 9.0, 12.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.93120574951172, -36.79109191894531, -35.650978088378906, -34.5108642578125, -33.370750427246094, -32.23063659667969, -31.090524673461914, -29.950410842895508, -28.8102970123291, -27.670183181762695, -26.53006935119629, -25.389955520629883, -24.24984359741211, -23.109729766845703, -21.969615936279297, -20.82950210571289, -19.689388275146484, -18.549274444580078, -17.409160614013672, -16.269046783447266, -15.128933906555176, -13.98882007598877, -12.84870719909668, -11.708593368530273, -10.568479537963867, -9.428365707397461, -8.288251876831055, -7.148138999938965, -6.008025169372559, -4.867911338806152, -3.7277979850769043, -2.5876846313476562, -1.4475746154785156, -0.3074610233306885, 0.8326525688171387, 1.9727661609649658, 3.112879753112793, 4.252993583679199, 5.393106937408447, 6.533220291137695, 7.673334121704102, 8.813447952270508, 9.953561782836914, 11.093674659729004, 12.23378849029541, 13.373902320861816, 14.514015197753906, 15.654129028320312, 16.79424285888672, 17.934356689453125, 19.07447052001953, 20.214584350585938, 21.354698181152344, 22.49481201171875, 23.634923934936523, 24.77503776550293, 25.915151596069336, 27.055265426635742, 28.19537925720215, 29.335493087768555, 30.475605010986328, 31.615718841552734, 32.75583267211914, 33.89594650268555, 35.03606033325195]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 8.0, 8.0, 9.0, 9.0, 14.0, 14.0, 25.0, 23.0, 34.0, 46.0, 46.0, 40.0, 46.0, 50.0, 55.0, 39.0, 36.0, 46.0, 54.0, 41.0, 44.0, 35.0, 32.0, 48.0, 36.0, 23.0, 20.0, 20.0, 18.0, 15.0, 12.0, 4.0, 9.0, 4.0, 12.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.16796875, -5.00970458984375, -4.8514404296875, -4.69317626953125, -4.534912109375, -4.37664794921875, -4.2183837890625, -4.06011962890625, -3.90185546875, -3.74359130859375, -3.5853271484375, -3.42706298828125, -3.268798828125, -3.11053466796875, -2.9522705078125, -2.79400634765625, -2.6357421875, -2.47747802734375, -2.3192138671875, -2.16094970703125, -2.002685546875, -1.84442138671875, -1.6861572265625, -1.52789306640625, -1.36962890625, -1.21136474609375, -1.0531005859375, -0.89483642578125, -0.736572265625, -0.57830810546875, -0.4200439453125, -0.26177978515625, -0.103515625, 0.05474853515625, 0.2130126953125, 0.37127685546875, 0.529541015625, 0.68780517578125, 0.8460693359375, 1.00433349609375, 1.16259765625, 1.32086181640625, 1.4791259765625, 1.63739013671875, 1.795654296875, 1.95391845703125, 2.1121826171875, 2.27044677734375, 2.4287109375, 2.58697509765625, 2.7452392578125, 2.90350341796875, 3.061767578125, 3.22003173828125, 3.3782958984375, 3.53656005859375, 3.69482421875, 3.85308837890625, 4.0113525390625, 4.16961669921875, 4.327880859375, 4.48614501953125, 4.6444091796875, 4.80267333984375, 4.9609375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 10.0, 10.0, 15.0, 21.0, 45.0, 59.0, 86.0, 149.0, 220.0, 326.0, 541.0, 844.0, 1331.0, 2026.0, 3424.0, 5282.0, 8457.0, 13616.0, 22628.0, 36920.0, 59712.0, 95604.0, 147922.0, 196096.0, 164943.0, 108651.0, 68596.0, 42749.0, 26209.0, 16124.0, 9801.0, 6028.0, 3671.0, 2369.0, 1479.0, 919.0, 600.0, 388.0, 237.0, 153.0, 106.0, 68.0, 39.0, 23.0, 27.0, 14.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.34717559814453125, -0.3354644775390625, -0.32375335693359375, -0.312042236328125, -0.30033111572265625, -0.2886199951171875, -0.27690887451171875, -0.26519775390625, -0.25348663330078125, -0.2417755126953125, -0.23006439208984375, -0.218353271484375, -0.20664215087890625, -0.1949310302734375, -0.18321990966796875, -0.1715087890625, -0.15979766845703125, -0.1480865478515625, -0.13637542724609375, -0.124664306640625, -0.11295318603515625, -0.1012420654296875, -0.08953094482421875, -0.07781982421875, -0.06610870361328125, -0.0543975830078125, -0.04268646240234375, -0.030975341796875, -0.01926422119140625, -0.0075531005859375, 0.00415802001953125, 0.015869140625, 0.02758026123046875, 0.0392913818359375, 0.05100250244140625, 0.062713623046875, 0.07442474365234375, 0.0861358642578125, 0.09784698486328125, 0.10955810546875, 0.12126922607421875, 0.1329803466796875, 0.14469146728515625, 0.156402587890625, 0.16811370849609375, 0.1798248291015625, 0.19153594970703125, 0.2032470703125, 0.21495819091796875, 0.2266693115234375, 0.23838043212890625, 0.250091552734375, 0.26180267333984375, 0.2735137939453125, 0.28522491455078125, 0.29693603515625, 0.30864715576171875, 0.3203582763671875, 0.33206939697265625, 0.343780517578125, 0.35549163818359375, 0.3672027587890625, 0.37891387939453125, 0.390625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 5.0, 9.0, 5.0, 9.0, 12.0, 17.0, 21.0, 22.0, 26.0, 33.0, 33.0, 29.0, 27.0, 31.0, 39.0, 40.0, 38.0, 40.0, 46.0, 1057.0, 43.0, 45.0, 31.0, 33.0, 47.0, 37.0, 27.0, 23.0, 22.0, 25.0, 21.0, 19.0, 15.0, 9.0, 11.0, 11.0, 13.0, 11.0, 6.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.578125, -2.492950439453125, -2.40777587890625, -2.322601318359375, -2.2374267578125, -2.152252197265625, -2.06707763671875, -1.981903076171875, -1.896728515625, -1.811553955078125, -1.72637939453125, -1.641204833984375, -1.5560302734375, -1.470855712890625, -1.38568115234375, -1.300506591796875, -1.21533203125, -1.130157470703125, -1.04498291015625, -0.959808349609375, -0.8746337890625, -0.789459228515625, -0.70428466796875, -0.619110107421875, -0.533935546875, -0.448760986328125, -0.36358642578125, -0.278411865234375, -0.1932373046875, -0.108062744140625, -0.02288818359375, 0.062286376953125, 0.1474609375, 0.232635498046875, 0.31781005859375, 0.402984619140625, 0.4881591796875, 0.573333740234375, 0.65850830078125, 0.743682861328125, 0.828857421875, 0.914031982421875, 0.99920654296875, 1.084381103515625, 1.1695556640625, 1.254730224609375, 1.33990478515625, 1.425079345703125, 1.51025390625, 1.595428466796875, 1.68060302734375, 1.765777587890625, 1.8509521484375, 1.936126708984375, 2.02130126953125, 2.106475830078125, 2.191650390625, 2.276824951171875, 2.36199951171875, 2.447174072265625, 2.5323486328125, 2.617523193359375, 2.70269775390625, 2.787872314453125, 2.873046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 10.0, 13.0, 19.0, 34.0, 35.0, 60.0, 99.0, 123.0, 218.0, 298.0, 471.0, 633.0, 974.0, 1500.0, 2274.0, 3240.0, 4828.0, 7398.0, 10955.0, 16239.0, 24049.0, 35991.0, 53282.0, 79037.0, 114201.0, 151178.0, 1200487.0, 122739.0, 87554.0, 58947.0, 39726.0, 26355.0, 17846.0, 11899.0, 7986.0, 5326.0, 3643.0, 2457.0, 1623.0, 1055.0, 797.0, 552.0, 296.0, 234.0, 157.0, 96.0, 62.0, 35.0, 37.0, 19.0, 19.0, 8.0, 10.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.261962890625, -0.25405311584472656, -0.24614334106445312, -0.2382335662841797, -0.23032379150390625, -0.2224140167236328, -0.21450424194335938, -0.20659446716308594, -0.1986846923828125, -0.19077491760253906, -0.18286514282226562, -0.1749553680419922, -0.16704559326171875, -0.1591358184814453, -0.15122604370117188, -0.14331626892089844, -0.135406494140625, -0.12749671936035156, -0.11958694458007812, -0.11167716979980469, -0.10376739501953125, -0.09585762023925781, -0.08794784545898438, -0.08003807067871094, -0.0721282958984375, -0.06421852111816406, -0.056308746337890625, -0.04839897155761719, -0.04048919677734375, -0.03257942199707031, -0.024669647216796875, -0.016759872436523438, -0.00885009765625, -0.0009403228759765625, 0.006969451904296875, 0.014879226684570312, 0.02278900146484375, 0.030698776245117188, 0.038608551025390625, 0.04651832580566406, 0.0544281005859375, 0.06233787536621094, 0.07024765014648438, 0.07815742492675781, 0.08606719970703125, 0.09397697448730469, 0.10188674926757812, 0.10979652404785156, 0.117706298828125, 0.12561607360839844, 0.13352584838867188, 0.1414356231689453, 0.14934539794921875, 0.1572551727294922, 0.16516494750976562, 0.17307472229003906, 0.1809844970703125, 0.18889427185058594, 0.19680404663085938, 0.2047138214111328, 0.21262359619140625, 0.2205333709716797, 0.22844314575195312, 0.23635292053222656, 0.2442626953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 8.0, 6.0, 8.0, 6.0, 11.0, 17.0, 16.0, 22.0, 17.0, 27.0, 39.0, 26.0, 39.0, 35.0, 41.0, 41.0, 53.0, 53.0, 58.0, 42.0, 41.0, 48.0, 58.0, 38.0, 40.0, 37.0, 36.0, 21.0, 18.0, 13.0, 9.0, 13.0, 17.0, 10.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.000743865966796875, -0.0007175654172897339, -0.0006912648677825928, -0.0006649643182754517, -0.0006386637687683105, -0.0006123632192611694, -0.0005860626697540283, -0.0005597621202468872, -0.0005334615707397461, -0.000507161021232605, -0.00048086047172546387, -0.00045455992221832275, -0.00042825937271118164, -0.00040195882320404053, -0.0003756582736968994, -0.0003493577241897583, -0.0003230571746826172, -0.0002967566251754761, -0.00027045607566833496, -0.00024415552616119385, -0.00021785497665405273, -0.00019155442714691162, -0.0001652538776397705, -0.0001389533281326294, -0.00011265277862548828, -8.635222911834717e-05, -6.0051679611206055e-05, -3.375113010406494e-05, -7.450580596923828e-06, 1.8849968910217285e-05, 4.51505184173584e-05, 7.145106792449951e-05, 9.775161743164062e-05, 0.00012405216693878174, 0.00015035271644592285, 0.00017665326595306396, 0.00020295381546020508, 0.0002292543649673462, 0.0002555549144744873, 0.0002818554639816284, 0.00030815601348876953, 0.00033445656299591064, 0.00036075711250305176, 0.00038705766201019287, 0.000413358211517334, 0.0004396587610244751, 0.0004659593105316162, 0.0004922598600387573, 0.0005185604095458984, 0.0005448609590530396, 0.0005711615085601807, 0.0005974620580673218, 0.0006237626075744629, 0.000650063157081604, 0.0006763637065887451, 0.0007026642560958862, 0.0007289648056030273, 0.0007552653551101685, 0.0007815659046173096, 0.0008078664541244507, 0.0008341670036315918, 0.0008604675531387329, 0.000886768102645874, 0.0009130686521530151, 0.0009393692016601562]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 5.0, 9.0, 11.0, 13.0, 14.0, 25.0, 31.0, 34.0, 40.0, 67.0, 106.0, 156.0, 202.0, 311.0, 511.0, 1421.0, 37662.0, 946986.0, 57628.0, 1739.0, 540.0, 318.0, 183.0, 125.0, 103.0, 68.0, 44.0, 45.0, 30.0, 21.0, 21.0, 26.0, 13.0, 6.0, 8.0, 11.0, 6.0, 0.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01715087890625, -0.016654372215270996, -0.016157865524291992, -0.01566135883331299, -0.015164852142333984, -0.01466834545135498, -0.014171838760375977, -0.013675332069396973, -0.013178825378417969, -0.012682318687438965, -0.012185811996459961, -0.011689305305480957, -0.011192798614501953, -0.01069629192352295, -0.010199785232543945, -0.009703278541564941, -0.009206771850585938, -0.008710265159606934, -0.00821375846862793, -0.007717251777648926, -0.007220745086669922, -0.006724238395690918, -0.006227731704711914, -0.00573122501373291, -0.005234718322753906, -0.004738211631774902, -0.0042417049407958984, -0.0037451982498168945, -0.0032486915588378906, -0.0027521848678588867, -0.002255678176879883, -0.001759171485900879, -0.001262664794921875, -0.0007661581039428711, -0.0002696514129638672, 0.00022685527801513672, 0.0007233619689941406, 0.0012198686599731445, 0.0017163753509521484, 0.0022128820419311523, 0.0027093887329101562, 0.00320589542388916, 0.003702402114868164, 0.004198908805847168, 0.004695415496826172, 0.005191922187805176, 0.00568842887878418, 0.006184935569763184, 0.0066814422607421875, 0.007177948951721191, 0.007674455642700195, 0.0081709623336792, 0.008667469024658203, 0.009163975715637207, 0.009660482406616211, 0.010156989097595215, 0.010653495788574219, 0.011150002479553223, 0.011646509170532227, 0.01214301586151123, 0.012639522552490234, 0.013136029243469238, 0.013632535934448242, 0.014129042625427246, 0.01462554931640625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 12.0, 21.0, 36.0, 73.0, 91.0, 151.0, 152.0, 155.0, 107.0, 87.0, 50.0, 25.0, 20.0, 8.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012561699841171503, -0.0012219747295603156, -0.0011877795914188027, -0.001153584336861968, -0.0011193891987204552, -0.0010851939441636205, -0.0010509986896067858, -0.001016803551465273, -0.0009826082969084382, -0.0009484131005592644, -0.0009142179042100906, -0.0008800226496532559, -0.0008458274533040822, -0.0008116322569549084, -0.0007774370606057346, -0.0007432418642565608, -0.000709046667907387, -0.0006748514715582132, -0.0006406562752090394, -0.0006064610788598657, -0.000572265824303031, -0.0005380706279538572, -0.0005038754316046834, -0.0004696802352555096, -0.0004354850098025054, -0.0004012898134533316, -0.00036709458800032735, -0.00033289939165115356, -0.0002987041953019798, -0.00026450896984897554, -0.00023031377349980175, -0.00019611856259871274, -0.00016192340990528464, -0.00012772819900419563, -9.353299537906423e-05, -5.9337791753932834e-05, -2.514258085284382e-05, 9.052630048245192e-06, 4.3247826397418976e-05, 7.744303729850799e-05, 0.000111638248199597, 0.00014583345910068601, 0.00018002867000177503, 0.0002142238663509488, 0.0002484190627001226, 0.00028261428815312684, 0.0003168094845023006, 0.00035100470995530486, 0.00038519990630447865, 0.00041939510265365243, 0.00045359032810665667, 0.00048778552445583045, 0.0005219807499088347, 0.0005561759462580085, 0.0005903711426071823, 0.000624566338956356, 0.0006587615935131907, 0.0006929567898623645, 0.0007271519862115383, 0.000761347240768373, 0.0007955424371175468, 0.0008297376334667206, 0.0008639328298158944, 0.0008981280261650681, 0.0009323232225142419]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 14.0, 6.0, 13.0, 16.0, 13.0, 14.0, 12.0, 24.0, 21.0, 36.0, 21.0, 26.0, 26.0, 36.0, 36.0, 38.0, 38.0, 51.0, 33.0, 49.0, 37.0, 38.0, 40.0, 39.0, 33.0, 33.0, 30.0, 27.0, 24.0, 29.0, 22.0, 26.0, 14.0, 15.0, 9.0, 12.0, 10.0, 3.0, 5.0, 3.0, 5.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00047218799591064453, -0.0004574321210384369, -0.00044267624616622925, -0.0004279203712940216, -0.00041316449642181396, -0.0003984086215496063, -0.0003836527466773987, -0.00036889687180519104, -0.0003541409969329834, -0.00033938512206077576, -0.0003246292471885681, -0.0003098733723163605, -0.00029511749744415283, -0.0002803616225719452, -0.00026560574769973755, -0.0002508498728275299, -0.00023609399795532227, -0.00022133812308311462, -0.00020658224821090698, -0.00019182637333869934, -0.0001770704984664917, -0.00016231462359428406, -0.00014755874872207642, -0.00013280287384986877, -0.00011804699897766113, -0.00010329112410545349, -8.853524923324585e-05, -7.377937436103821e-05, -5.9023499488830566e-05, -4.4267624616622925e-05, -2.9511749744415283e-05, -1.4755874872207642e-05, 0.0, 1.4755874872207642e-05, 2.9511749744415283e-05, 4.4267624616622925e-05, 5.9023499488830566e-05, 7.377937436103821e-05, 8.853524923324585e-05, 0.00010329112410545349, 0.00011804699897766113, 0.00013280287384986877, 0.00014755874872207642, 0.00016231462359428406, 0.0001770704984664917, 0.00019182637333869934, 0.00020658224821090698, 0.00022133812308311462, 0.00023609399795532227, 0.0002508498728275299, 0.00026560574769973755, 0.0002803616225719452, 0.00029511749744415283, 0.0003098733723163605, 0.0003246292471885681, 0.00033938512206077576, 0.0003541409969329834, 0.00036889687180519104, 0.0003836527466773987, 0.0003984086215496063, 0.00041316449642181396, 0.0004279203712940216, 0.00044267624616622925, 0.0004574321210384369, 0.00047218799591064453]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 8.0, 8.0, 9.0, 9.0, 14.0, 14.0, 25.0, 23.0, 34.0, 46.0, 46.0, 40.0, 46.0, 50.0, 55.0, 39.0, 36.0, 46.0, 54.0, 41.0, 44.0, 35.0, 32.0, 48.0, 36.0, 23.0, 20.0, 20.0, 18.0, 15.0, 12.0, 4.0, 9.0, 4.0, 12.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.16796875, -5.00970458984375, -4.8514404296875, -4.69317626953125, -4.534912109375, -4.37664794921875, -4.2183837890625, -4.06011962890625, -3.90185546875, -3.74359130859375, -3.5853271484375, -3.42706298828125, -3.268798828125, -3.11053466796875, -2.9522705078125, -2.79400634765625, -2.6357421875, -2.47747802734375, -2.3192138671875, -2.16094970703125, -2.002685546875, -1.84442138671875, -1.6861572265625, -1.52789306640625, -1.36962890625, -1.21136474609375, -1.0531005859375, -0.89483642578125, -0.736572265625, -0.57830810546875, -0.4200439453125, -0.26177978515625, -0.103515625, 0.05474853515625, 0.2130126953125, 0.37127685546875, 0.529541015625, 0.68780517578125, 0.8460693359375, 1.00433349609375, 1.16259765625, 1.32086181640625, 1.4791259765625, 1.63739013671875, 1.795654296875, 1.95391845703125, 2.1121826171875, 2.27044677734375, 2.4287109375, 2.58697509765625, 2.7452392578125, 2.90350341796875, 3.061767578125, 3.22003173828125, 3.3782958984375, 3.53656005859375, 3.69482421875, 3.85308837890625, 4.0113525390625, 4.16961669921875, 4.327880859375, 4.48614501953125, 4.6444091796875, 4.80267333984375, 4.9609375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 9.0, 7.0, 21.0, 30.0, 28.0, 38.0, 76.0, 90.0, 168.0, 240.0, 425.0, 739.0, 1494.0, 2794.0, 5419.0, 10302.0, 19674.0, 37582.0, 79369.0, 200567.0, 358969.0, 182696.0, 73334.0, 35331.0, 18432.0, 9734.0, 5196.0, 2689.0, 1357.0, 730.0, 406.0, 216.0, 114.0, 87.0, 57.0, 35.0, 22.0, 10.0, 16.0, 13.0, 6.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.03125, -3.903076171875, -3.77490234375, -3.646728515625, -3.5185546875, -3.390380859375, -3.26220703125, -3.134033203125, -3.005859375, -2.877685546875, -2.74951171875, -2.621337890625, -2.4931640625, -2.364990234375, -2.23681640625, -2.108642578125, -1.98046875, -1.852294921875, -1.72412109375, -1.595947265625, -1.4677734375, -1.339599609375, -1.21142578125, -1.083251953125, -0.955078125, -0.826904296875, -0.69873046875, -0.570556640625, -0.4423828125, -0.314208984375, -0.18603515625, -0.057861328125, 0.0703125, 0.198486328125, 0.32666015625, 0.454833984375, 0.5830078125, 0.711181640625, 0.83935546875, 0.967529296875, 1.095703125, 1.223876953125, 1.35205078125, 1.480224609375, 1.6083984375, 1.736572265625, 1.86474609375, 1.992919921875, 2.12109375, 2.249267578125, 2.37744140625, 2.505615234375, 2.6337890625, 2.761962890625, 2.89013671875, 3.018310546875, 3.146484375, 3.274658203125, 3.40283203125, 3.531005859375, 3.6591796875, 3.787353515625, 3.91552734375, 4.043701171875, 4.171875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 9.0, 13.0, 14.0, 13.0, 14.0, 20.0, 23.0, 28.0, 33.0, 34.0, 40.0, 41.0, 53.0, 39.0, 64.0, 100.0, 166.0, 1510.0, 228.0, 127.0, 56.0, 53.0, 46.0, 43.0, 30.0, 41.0, 35.0, 29.0, 23.0, 22.0, 19.0, 19.0, 9.0, 10.0, 6.0, 9.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.6474609375, -17.107421875, -16.5673828125, -16.02734375, -15.4873046875, -14.947265625, -14.4072265625, -13.8671875, -13.3271484375, -12.787109375, -12.2470703125, -11.70703125, -11.1669921875, -10.626953125, -10.0869140625, -9.546875, -9.0068359375, -8.466796875, -7.9267578125, -7.38671875, -6.8466796875, -6.306640625, -5.7666015625, -5.2265625, -4.6865234375, -4.146484375, -3.6064453125, -3.06640625, -2.5263671875, -1.986328125, -1.4462890625, -0.90625, -0.3662109375, 0.173828125, 0.7138671875, 1.25390625, 1.7939453125, 2.333984375, 2.8740234375, 3.4140625, 3.9541015625, 4.494140625, 5.0341796875, 5.57421875, 6.1142578125, 6.654296875, 7.1943359375, 7.734375, 8.2744140625, 8.814453125, 9.3544921875, 9.89453125, 10.4345703125, 10.974609375, 11.5146484375, 12.0546875, 12.5947265625, 13.134765625, 13.6748046875, 14.21484375, 14.7548828125, 15.294921875, 15.8349609375, 16.375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 6.0, 7.0, 13.0, 18.0, 18.0, 59.0, 99.0, 211.0, 586.0, 8588.0, 3132816.0, 2477.0, 411.0, 170.0, 84.0, 46.0, 31.0, 27.0, 9.0, 11.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.3125, -113.1748046875, -109.037109375, -104.8994140625, -100.76171875, -96.6240234375, -92.486328125, -88.3486328125, -84.2109375, -80.0732421875, -75.935546875, -71.7978515625, -67.66015625, -63.5224609375, -59.384765625, -55.2470703125, -51.109375, -46.9716796875, -42.833984375, -38.6962890625, -34.55859375, -30.4208984375, -26.283203125, -22.1455078125, -18.0078125, -13.8701171875, -9.732421875, -5.5947265625, -1.45703125, 2.6806640625, 6.818359375, 10.9560546875, 15.09375, 19.2314453125, 23.369140625, 27.5068359375, 31.64453125, 35.7822265625, 39.919921875, 44.0576171875, 48.1953125, 52.3330078125, 56.470703125, 60.6083984375, 64.74609375, 68.8837890625, 73.021484375, 77.1591796875, 81.296875, 85.4345703125, 89.572265625, 93.7099609375, 97.84765625, 101.9853515625, 106.123046875, 110.2607421875, 114.3984375, 118.5361328125, 122.673828125, 126.8115234375, 130.94921875, 135.0869140625, 139.224609375, 143.3623046875, 147.5]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1010.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.05943298339844, -64.73582458496094, -46.41221237182617, -28.088600158691406, -9.764991760253906, 8.558616638183594, 26.882232666015625, 45.205841064453125, 63.529449462890625, 81.85305786132812, 100.17666625976562, 118.50028228759766, 136.82388305664062, 155.14749145507812, 173.4711151123047, 191.7947235107422, 210.1183319091797, 228.4419403076172, 246.7655487060547, 265.08917236328125, 283.41278076171875, 301.73638916015625, 320.05999755859375, 338.38360595703125, 356.70721435546875, 375.03082275390625, 393.35443115234375, 411.67803955078125, 430.00164794921875, 448.32525634765625, 466.64886474609375, 484.97247314453125, 503.29608154296875, 521.6196899414062, 539.9432983398438, 558.2669067382812, 576.5905151367188, 594.9141235351562, 613.2377319335938, 631.5613403320312, 649.8849487304688, 668.2085571289062, 686.5321655273438, 704.8557739257812, 723.1793823242188, 741.5029907226562, 759.8265991210938, 778.1502075195312, 796.473876953125, 814.7974853515625, 833.12109375, 851.4447021484375, 869.768310546875, 888.0919189453125, 906.41552734375, 924.7391357421875, 943.062744140625, 961.3863525390625, 979.7099609375, 998.0335693359375, 1016.357177734375, 1034.6807861328125, 1053.00439453125, 1071.3280029296875, 1089.651611328125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 13.0, 6.0, 12.0, 17.0, 21.0, 17.0, 23.0, 25.0, 30.0, 30.0, 22.0, 26.0, 30.0, 42.0, 39.0, 44.0, 49.0, 28.0, 44.0, 45.0, 41.0, 42.0, 56.0, 34.0, 30.0, 29.0, 23.0, 34.0, 13.0, 21.0, 10.0, 16.0, 12.0, 12.0, 10.0, 5.0, 14.0, 9.0, 5.0, 6.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.9068717956543, -41.4150390625, -39.92321014404297, -38.43137741088867, -36.939544677734375, -35.44771194458008, -33.95587921142578, -32.46405029296875, -30.972217559814453, -29.480384826660156, -27.988554000854492, -26.496723175048828, -25.00489044189453, -23.513057708740234, -22.02122688293457, -20.529396057128906, -19.03756332397461, -17.545730590820312, -16.05389976501465, -14.562067985534668, -13.070236206054688, -11.578404426574707, -10.086572647094727, -8.594740867614746, -7.102909088134766, -5.611077308654785, -4.119245529174805, -2.627413749694824, -1.1355819702148438, 0.3562498092651367, 1.8480815887451172, 3.3399133682250977, 4.8317413330078125, 6.323573112487793, 7.815404891967773, 9.307236671447754, 10.799068450927734, 12.290900230407715, 13.782732009887695, 15.274563789367676, 16.766395568847656, 18.258228302001953, 19.750059127807617, 21.24188995361328, 22.733722686767578, 24.225555419921875, 25.71738624572754, 27.209217071533203, 28.7010498046875, 30.192882537841797, 31.68471336364746, 33.176544189453125, 34.66837692260742, 36.16020965576172, 37.65203857421875, 39.14387130737305, 40.635704040527344, 42.12753677368164, 43.61936950683594, 45.11119842529297, 46.603031158447266, 48.09486389160156, 49.586692810058594, 51.07852554321289, 52.57035827636719]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 10.0, 9.0, 6.0, 10.0, 13.0, 19.0, 21.0, 15.0, 28.0, 39.0, 45.0, 40.0, 48.0, 43.0, 50.0, 37.0, 52.0, 48.0, 38.0, 57.0, 40.0, 41.0, 40.0, 30.0, 39.0, 31.0, 26.0, 23.0, 17.0, 19.0, 13.0, 12.0, 4.0, 9.0, 5.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.3433837890625, -5.167236328125, -4.9910888671875, -4.81494140625, -4.6387939453125, -4.462646484375, -4.2864990234375, -4.1103515625, -3.9342041015625, -3.758056640625, -3.5819091796875, -3.40576171875, -3.2296142578125, -3.053466796875, -2.8773193359375, -2.701171875, -2.5250244140625, -2.348876953125, -2.1727294921875, -1.99658203125, -1.8204345703125, -1.644287109375, -1.4681396484375, -1.2919921875, -1.1158447265625, -0.939697265625, -0.7635498046875, -0.58740234375, -0.4112548828125, -0.235107421875, -0.0589599609375, 0.1171875, 0.2933349609375, 0.469482421875, 0.6456298828125, 0.82177734375, 0.9979248046875, 1.174072265625, 1.3502197265625, 1.5263671875, 1.7025146484375, 1.878662109375, 2.0548095703125, 2.23095703125, 2.4071044921875, 2.583251953125, 2.7593994140625, 2.935546875, 3.1116943359375, 3.287841796875, 3.4639892578125, 3.64013671875, 3.8162841796875, 3.992431640625, 4.1685791015625, 4.3447265625, 4.5208740234375, 4.697021484375, 4.8731689453125, 5.04931640625, 5.2254638671875, 5.401611328125, 5.5777587890625, 5.75390625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 16.0, 17.0, 24.0, 28.0, 34.0, 49.0, 72.0, 131.0, 224.0, 421.0, 872.0, 2667.0, 10212.0, 52793.0, 326256.0, 1440286.0, 1773679.0, 487036.0, 78908.0, 14649.0, 3577.0, 1108.0, 486.0, 232.0, 156.0, 92.0, 67.0, 45.0, 33.0, 18.0, 12.0, 11.0, 11.0, 7.0, 5.0, 8.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.8082275390625, -7.530517578125, -7.2528076171875, -6.97509765625, -6.6973876953125, -6.419677734375, -6.1419677734375, -5.8642578125, -5.5865478515625, -5.308837890625, -5.0311279296875, -4.75341796875, -4.4757080078125, -4.197998046875, -3.9202880859375, -3.642578125, -3.3648681640625, -3.087158203125, -2.8094482421875, -2.53173828125, -2.2540283203125, -1.976318359375, -1.6986083984375, -1.4208984375, -1.1431884765625, -0.865478515625, -0.5877685546875, -0.31005859375, -0.0323486328125, 0.245361328125, 0.5230712890625, 0.80078125, 1.0784912109375, 1.356201171875, 1.6339111328125, 1.91162109375, 2.1893310546875, 2.467041015625, 2.7447509765625, 3.0224609375, 3.3001708984375, 3.577880859375, 3.8555908203125, 4.13330078125, 4.4110107421875, 4.688720703125, 4.9664306640625, 5.244140625, 5.5218505859375, 5.799560546875, 6.0772705078125, 6.35498046875, 6.6326904296875, 6.910400390625, 7.1881103515625, 7.4658203125, 7.7435302734375, 8.021240234375, 8.2989501953125, 8.57666015625, 8.8543701171875, 9.132080078125, 9.4097900390625, 9.6875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 15.0, 15.0, 40.0, 43.0, 74.0, 100.0, 117.0, 154.0, 226.0, 347.0, 436.0, 483.0, 473.0, 418.0, 289.0, 255.0, 174.0, 129.0, 79.0, 53.0, 45.0, 28.0, 22.0, 20.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0], "bins": [-16.671875, -16.2647705078125, -15.857666015625, -15.4505615234375, -15.04345703125, -14.6363525390625, -14.229248046875, -13.8221435546875, -13.4150390625, -13.0079345703125, -12.600830078125, -12.1937255859375, -11.78662109375, -11.3795166015625, -10.972412109375, -10.5653076171875, -10.158203125, -9.7510986328125, -9.343994140625, -8.9368896484375, -8.52978515625, -8.1226806640625, -7.715576171875, -7.3084716796875, -6.9013671875, -6.4942626953125, -6.087158203125, -5.6800537109375, -5.27294921875, -4.8658447265625, -4.458740234375, -4.0516357421875, -3.64453125, -3.2374267578125, -2.830322265625, -2.4232177734375, -2.01611328125, -1.6090087890625, -1.201904296875, -0.7947998046875, -0.3876953125, 0.0194091796875, 0.426513671875, 0.8336181640625, 1.24072265625, 1.6478271484375, 2.054931640625, 2.4620361328125, 2.869140625, 3.2762451171875, 3.683349609375, 4.0904541015625, 4.49755859375, 4.9046630859375, 5.311767578125, 5.7188720703125, 6.1259765625, 6.5330810546875, 6.940185546875, 7.3472900390625, 7.75439453125, 8.1614990234375, 8.568603515625, 8.9757080078125, 9.3828125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 10.0, 6.0, 6.0, 14.0, 21.0, 37.0, 40.0, 50.0, 83.0, 114.0, 179.0, 308.0, 565.0, 1800.0, 11783.0, 259744.0, 3233560.0, 656456.0, 25142.0, 2624.0, 702.0, 351.0, 223.0, 146.0, 99.0, 72.0, 50.0, 35.0, 15.0, 17.0, 15.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.294921875, -18.51171875, -17.728515625, -16.9453125, -16.162109375, -15.37890625, -14.595703125, -13.8125, -13.029296875, -12.24609375, -11.462890625, -10.6796875, -9.896484375, -9.11328125, -8.330078125, -7.546875, -6.763671875, -5.98046875, -5.197265625, -4.4140625, -3.630859375, -2.84765625, -2.064453125, -1.28125, -0.498046875, 0.28515625, 1.068359375, 1.8515625, 2.634765625, 3.41796875, 4.201171875, 4.984375, 5.767578125, 6.55078125, 7.333984375, 8.1171875, 8.900390625, 9.68359375, 10.466796875, 11.25, 12.033203125, 12.81640625, 13.599609375, 14.3828125, 15.166015625, 15.94921875, 16.732421875, 17.515625, 18.298828125, 19.08203125, 19.865234375, 20.6484375, 21.431640625, 22.21484375, 22.998046875, 23.78125, 24.564453125, 25.34765625, 26.130859375, 26.9140625, 27.697265625, 28.48046875, 29.263671875, 30.046875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 12.0, 29.0, 74.0, 167.0, 211.0, 225.0, 166.0, 70.0, 35.0, 13.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.85086059570312, -130.50595092773438, -127.16104888916016, -123.8161392211914, -120.47123718261719, -117.12632751464844, -113.78141784667969, -110.43650817871094, -107.09160614013672, -103.74669647216797, -100.40179443359375, -97.056884765625, -93.71197509765625, -90.36707305908203, -87.02216339111328, -83.67726135253906, -80.33235168457031, -76.98744201660156, -73.64253997802734, -70.2976303100586, -66.95272827148438, -63.607818603515625, -60.262908935546875, -56.91800308227539, -53.573097229003906, -50.22819137573242, -46.88328552246094, -43.53837585449219, -40.1934700012207, -36.84856414794922, -33.50365447998047, -30.158748626708984, -26.81383514404297, -23.468929290771484, -20.124021530151367, -16.77911376953125, -13.434207916259766, -10.089302062988281, -6.744394302368164, -3.399486541748047, -0.0545806884765625, 3.2903261184692383, 6.635232925415039, 9.98013973236084, 13.32504653930664, 16.669952392578125, 20.014860153198242, 23.35976791381836, 26.704673767089844, 30.049579620361328, 33.39448547363281, 36.73939514160156, 40.08430099487305, 43.42920684814453, 46.77411651611328, 50.119022369384766, 53.46392822265625, 56.808834075927734, 60.15373992919922, 63.49864959716797, 66.84355163574219, 70.18846130371094, 73.53337097167969, 76.87828063964844, 80.22318267822266]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 2.0, 5.0, 17.0, 10.0, 13.0, 22.0, 15.0, 20.0, 13.0, 26.0, 38.0, 47.0, 34.0, 44.0, 37.0, 50.0, 48.0, 50.0, 39.0, 30.0, 67.0, 44.0, 48.0, 26.0, 44.0, 31.0, 33.0, 24.0, 23.0, 21.0, 19.0, 12.0, 8.0, 7.0, 11.0, 7.0, 0.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.96455383300781, -41.62192153930664, -40.27928924560547, -38.9366569519043, -37.594024658203125, -36.25139236450195, -34.90876007080078, -33.56612777709961, -32.22349548339844, -30.880863189697266, -29.538230895996094, -28.195598602294922, -26.85296630859375, -25.510334014892578, -24.167701721191406, -22.825069427490234, -21.48243522644043, -20.139802932739258, -18.797170639038086, -17.454538345336914, -16.111906051635742, -14.76927375793457, -13.426640510559082, -12.08400821685791, -10.741375923156738, -9.398743629455566, -8.056111335754395, -6.7134785652160645, -5.370846271514893, -4.028213977813721, -2.6855812072753906, -1.3429489135742188, -0.000316619873046875, 1.3423157930374146, 2.684948205947876, 4.027580738067627, 5.370213031768799, 6.712845325469971, 8.0554780960083, 9.398110389709473, 10.740742683410645, 12.083374977111816, 13.426007270812988, 14.768640518188477, 16.11127281188965, 17.45390510559082, 18.796537399291992, 20.139169692993164, 21.481801986694336, 22.824434280395508, 24.16706657409668, 25.50969886779785, 26.852331161499023, 28.194963455200195, 29.53759765625, 30.880229949951172, 32.222862243652344, 33.565494537353516, 34.90812683105469, 36.25075912475586, 37.59339141845703, 38.9360237121582, 40.278656005859375, 41.62128829956055, 42.96392059326172]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 10.0, 6.0, 11.0, 10.0, 15.0, 16.0, 17.0, 18.0, 31.0, 35.0, 43.0, 51.0, 44.0, 44.0, 61.0, 57.0, 51.0, 61.0, 47.0, 61.0, 53.0, 37.0, 41.0, 26.0, 32.0, 30.0, 17.0, 19.0, 9.0, 16.0, 10.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.2442626953125, -5.047119140625, -4.8499755859375, -4.65283203125, -4.4556884765625, -4.258544921875, -4.0614013671875, -3.8642578125, -3.6671142578125, -3.469970703125, -3.2728271484375, -3.07568359375, -2.8785400390625, -2.681396484375, -2.4842529296875, -2.287109375, -2.0899658203125, -1.892822265625, -1.6956787109375, -1.49853515625, -1.3013916015625, -1.104248046875, -0.9071044921875, -0.7099609375, -0.5128173828125, -0.315673828125, -0.1185302734375, 0.07861328125, 0.2757568359375, 0.472900390625, 0.6700439453125, 0.8671875, 1.0643310546875, 1.261474609375, 1.4586181640625, 1.65576171875, 1.8529052734375, 2.050048828125, 2.2471923828125, 2.4443359375, 2.6414794921875, 2.838623046875, 3.0357666015625, 3.23291015625, 3.4300537109375, 3.627197265625, 3.8243408203125, 4.021484375, 4.2186279296875, 4.415771484375, 4.6129150390625, 4.81005859375, 5.0072021484375, 5.204345703125, 5.4014892578125, 5.5986328125, 5.7957763671875, 5.992919921875, 6.1900634765625, 6.38720703125, 6.5843505859375, 6.781494140625, 6.9786376953125, 7.17578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 23.0, 39.0, 37.0, 57.0, 94.0, 162.0, 267.0, 454.0, 773.0, 1185.0, 1935.0, 3150.0, 4946.0, 7893.0, 12423.0, 19887.0, 32261.0, 52527.0, 87862.0, 146994.0, 213330.0, 180149.0, 110635.0, 65979.0, 39724.0, 24679.0, 15202.0, 9581.0, 6207.0, 3875.0, 2363.0, 1516.0, 907.0, 569.0, 340.0, 189.0, 112.0, 85.0, 45.0, 34.0, 17.0, 13.0, 6.0, 11.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39794921875, -0.38455963134765625, -0.3711700439453125, -0.35778045654296875, -0.344390869140625, -0.33100128173828125, -0.3176116943359375, -0.30422210693359375, -0.29083251953125, -0.27744293212890625, -0.2640533447265625, -0.25066375732421875, -0.237274169921875, -0.22388458251953125, -0.2104949951171875, -0.19710540771484375, -0.1837158203125, -0.17032623291015625, -0.1569366455078125, -0.14354705810546875, -0.130157470703125, -0.11676788330078125, -0.1033782958984375, -0.08998870849609375, -0.07659912109375, -0.06320953369140625, -0.0498199462890625, -0.03643035888671875, -0.023040771484375, -0.00965118408203125, 0.0037384033203125, 0.01712799072265625, 0.030517578125, 0.04390716552734375, 0.0572967529296875, 0.07068634033203125, 0.084075927734375, 0.09746551513671875, 0.1108551025390625, 0.12424468994140625, 0.13763427734375, 0.15102386474609375, 0.1644134521484375, 0.17780303955078125, 0.191192626953125, 0.20458221435546875, 0.2179718017578125, 0.23136138916015625, 0.2447509765625, 0.25814056396484375, 0.2715301513671875, 0.28491973876953125, 0.298309326171875, 0.31169891357421875, 0.3250885009765625, 0.33847808837890625, 0.35186767578125, 0.36525726318359375, 0.3786468505859375, 0.39203643798828125, 0.405426025390625, 0.41881561279296875, 0.4322052001953125, 0.44559478759765625, 0.458984375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 8.0, 5.0, 13.0, 14.0, 18.0, 13.0, 11.0, 30.0, 27.0, 19.0, 29.0, 28.0, 31.0, 30.0, 47.0, 44.0, 31.0, 29.0, 48.0, 1068.0, 31.0, 29.0, 40.0, 39.0, 28.0, 37.0, 33.0, 28.0, 29.0, 20.0, 26.0, 20.0, 18.0, 19.0, 9.0, 15.0, 8.0, 10.0, 8.0, 5.0, 2.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0], "bins": [-3.005859375, -2.915618896484375, -2.82537841796875, -2.735137939453125, -2.6448974609375, -2.554656982421875, -2.46441650390625, -2.374176025390625, -2.283935546875, -2.193695068359375, -2.10345458984375, -2.013214111328125, -1.9229736328125, -1.832733154296875, -1.74249267578125, -1.652252197265625, -1.56201171875, -1.471771240234375, -1.38153076171875, -1.291290283203125, -1.2010498046875, -1.110809326171875, -1.02056884765625, -0.930328369140625, -0.840087890625, -0.749847412109375, -0.65960693359375, -0.569366455078125, -0.4791259765625, -0.388885498046875, -0.29864501953125, -0.208404541015625, -0.1181640625, -0.027923583984375, 0.06231689453125, 0.152557373046875, 0.2427978515625, 0.333038330078125, 0.42327880859375, 0.513519287109375, 0.603759765625, 0.694000244140625, 0.78424072265625, 0.874481201171875, 0.9647216796875, 1.054962158203125, 1.14520263671875, 1.235443115234375, 1.32568359375, 1.415924072265625, 1.50616455078125, 1.596405029296875, 1.6866455078125, 1.776885986328125, 1.86712646484375, 1.957366943359375, 2.047607421875, 2.137847900390625, 2.22808837890625, 2.318328857421875, 2.4085693359375, 2.498809814453125, 2.58905029296875, 2.679290771484375, 2.76953125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 25.0, 26.0, 31.0, 48.0, 66.0, 121.0, 189.0, 254.0, 433.0, 580.0, 881.0, 1380.0, 2068.0, 3244.0, 4604.0, 7033.0, 10599.0, 16028.0, 24199.0, 36805.0, 56416.0, 85671.0, 125445.0, 1200836.0, 170210.0, 118124.0, 79045.0, 52341.0, 33959.0, 22361.0, 14738.0, 9994.0, 6523.0, 4244.0, 2894.0, 1924.0, 1267.0, 871.0, 562.0, 395.0, 247.0, 154.0, 106.0, 59.0, 44.0, 31.0, 12.0, 15.0, 11.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.29150390625, -0.2823677062988281, -0.27323150634765625, -0.2640953063964844, -0.2549591064453125, -0.24582290649414062, -0.23668670654296875, -0.22755050659179688, -0.218414306640625, -0.20927810668945312, -0.20014190673828125, -0.19100570678710938, -0.1818695068359375, -0.17273330688476562, -0.16359710693359375, -0.15446090698242188, -0.14532470703125, -0.13618850708007812, -0.12705230712890625, -0.11791610717773438, -0.1087799072265625, -0.09964370727539062, -0.09050750732421875, -0.08137130737304688, -0.072235107421875, -0.06309890747070312, -0.05396270751953125, -0.044826507568359375, -0.0356903076171875, -0.026554107666015625, -0.01741790771484375, -0.008281707763671875, 0.0008544921875, 0.009990692138671875, 0.01912689208984375, 0.028263092041015625, 0.0373992919921875, 0.046535491943359375, 0.05567169189453125, 0.06480789184570312, 0.073944091796875, 0.08308029174804688, 0.09221649169921875, 0.10135269165039062, 0.1104888916015625, 0.11962509155273438, 0.12876129150390625, 0.13789749145507812, 0.14703369140625, 0.15616989135742188, 0.16530609130859375, 0.17444229125976562, 0.1835784912109375, 0.19271469116210938, 0.20185089111328125, 0.21098709106445312, 0.220123291015625, 0.22925949096679688, 0.23839569091796875, 0.24753189086914062, 0.2566680908203125, 0.2658042907714844, 0.27494049072265625, 0.2840766906738281, 0.293212890625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 5.0, 10.0, 13.0, 14.0, 18.0, 17.0, 29.0, 26.0, 32.0, 42.0, 60.0, 37.0, 42.0, 51.0, 55.0, 62.0, 48.0, 55.0, 57.0, 30.0, 40.0, 44.0, 34.0, 29.0, 20.0, 23.0, 22.0, 14.0, 9.0, 15.0, 5.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001247406005859375, -0.0012080371379852295, -0.001168668270111084, -0.0011292994022369385, -0.001089930534362793, -0.0010505616664886475, -0.001011192798614502, -0.0009718239307403564, -0.0009324550628662109, -0.0008930861949920654, -0.0008537173271179199, -0.0008143484592437744, -0.0007749795913696289, -0.0007356107234954834, -0.0006962418556213379, -0.0006568729877471924, -0.0006175041198730469, -0.0005781352519989014, -0.0005387663841247559, -0.0004993975162506104, -0.00046002864837646484, -0.00042065978050231934, -0.00038129091262817383, -0.0003419220447540283, -0.0003025531768798828, -0.0002631843090057373, -0.0002238154411315918, -0.0001844465732574463, -0.00014507770538330078, -0.00010570883750915527, -6.633996963500977e-05, -2.6971101760864258e-05, 1.239776611328125e-05, 5.176663398742676e-05, 9.113550186157227e-05, 0.00013050436973571777, 0.00016987323760986328, 0.0002092421054840088, 0.0002486109733581543, 0.0002879798412322998, 0.0003273487091064453, 0.0003667175769805908, 0.00040608644485473633, 0.00044545531272888184, 0.00048482418060302734, 0.0005241930484771729, 0.0005635619163513184, 0.0006029307842254639, 0.0006422996520996094, 0.0006816685199737549, 0.0007210373878479004, 0.0007604062557220459, 0.0007997751235961914, 0.0008391439914703369, 0.0008785128593444824, 0.0009178817272186279, 0.0009572505950927734, 0.000996619462966919, 0.0010359883308410645, 0.00107535719871521, 0.0011147260665893555, 0.001154094934463501, 0.0011934638023376465, 0.001232832670211792, 0.0012722015380859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 9.0, 8.0, 16.0, 20.0, 10.0, 30.0, 30.0, 39.0, 50.0, 78.0, 138.0, 213.0, 358.0, 790.0, 6090.0, 992427.0, 45939.0, 1045.0, 496.0, 232.0, 158.0, 99.0, 63.0, 48.0, 35.0, 31.0, 16.0, 16.0, 12.0, 8.0, 9.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025909423828125, -0.025091171264648438, -0.024272918701171875, -0.023454666137695312, -0.02263641357421875, -0.021818161010742188, -0.020999908447265625, -0.020181655883789062, -0.0193634033203125, -0.018545150756835938, -0.017726898193359375, -0.016908645629882812, -0.01609039306640625, -0.015272140502929688, -0.014453887939453125, -0.013635635375976562, -0.0128173828125, -0.011999130249023438, -0.011180877685546875, -0.010362625122070312, -0.00954437255859375, -0.008726119995117188, -0.007907867431640625, -0.0070896148681640625, -0.0062713623046875, -0.0054531097412109375, -0.004634857177734375, -0.0038166046142578125, -0.00299835205078125, -0.0021800994873046875, -0.001361846923828125, -0.0005435943603515625, 0.000274658203125, 0.0010929107666015625, 0.001911163330078125, 0.0027294158935546875, 0.00354766845703125, 0.0043659210205078125, 0.005184173583984375, 0.0060024261474609375, 0.0068206787109375, 0.0076389312744140625, 0.008457183837890625, 0.009275436401367188, 0.01009368896484375, 0.010911941528320312, 0.011730194091796875, 0.012548446655273438, 0.01336669921875, 0.014184951782226562, 0.015003204345703125, 0.015821456909179688, 0.01663970947265625, 0.017457962036132812, 0.018276214599609375, 0.019094467163085938, 0.0199127197265625, 0.020730972290039062, 0.021549224853515625, 0.022367477416992188, 0.02318572998046875, 0.024003982543945312, 0.024822235107421875, 0.025640487670898438, 0.026458740234375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 23.0, 110.0, 396.0, 343.0, 117.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004974533338099718, -0.0048685637302696705, -0.004762594122439623, -0.004656624980270863, -0.004550655372440815, -0.004444685764610767, -0.00433871615678072, -0.0042327470146119595, -0.004126777406781912, -0.004020807798951864, -0.003914838191121817, -0.0038088688161224127, -0.0037028994411230087, -0.003596929833292961, -0.003490960458293557, -0.0033849908504635096, -0.0032790214754641056, -0.003173051867634058, -0.003067082492634654, -0.0029611128848046064, -0.0028551435098052025, -0.002749173901975155, -0.002643204526975751, -0.0025372349191457033, -0.0024312653113156557, -0.002325295703485608, -0.002219326328486204, -0.0021133567206561565, -0.0020073873456567526, -0.001901417737826705, -0.001795448362827301, -0.0016894787549972534, -0.0015835093799978495, -0.0014775398885831237, -0.001371570397168398, -0.0012656009057536721, -0.0011596314143389463, -0.0010536618065088987, -0.0009476923733018339, -0.0008417228818871081, -0.0007357533904723823, -0.0006297838990576565, -0.0005238144076429307, -0.0004178448871243745, -0.00031187539570964873, -0.0002059058751910925, -9.993638377636671e-05, 6.03310763835907e-06, 0.00011200259905308485, 0.00021797209046781063, 0.0003239415818825364, 0.00042991110240109265, 0.000535880564711988, 0.0006418501143343747, 0.0007478196057491004, 0.0008537890971638262, 0.000959758588578552, 0.0010657281382009387, 0.0011716976296156645, 0.0012776671210303903, 0.001383636612445116, 0.0014896061038598418, 0.0015955755952745676, 0.0017015450866892934, 0.0018075145781040192]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 9.0, 10.0, 7.0, 13.0, 11.0, 22.0, 23.0, 24.0, 30.0, 37.0, 32.0, 31.0, 41.0, 43.0, 49.0, 39.0, 28.0, 45.0, 46.0, 50.0, 41.0, 38.0, 39.0, 31.0, 35.0, 38.0, 26.0, 15.0, 18.0, 27.0, 18.0, 16.0, 11.0, 9.0, 5.0, 7.0, 6.0, 4.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006800293922424316, -0.0006577242165803909, -0.0006354190409183502, -0.0006131138652563095, -0.0005908086895942688, -0.0005685035139322281, -0.0005461983382701874, -0.0005238931626081467, -0.000501587986946106, -0.00047928281128406525, -0.00045697763562202454, -0.0004346724599599838, -0.0004123672842979431, -0.0003900621086359024, -0.0003677569329738617, -0.000345451757311821, -0.0003231465816497803, -0.00030084140598773956, -0.00027853623032569885, -0.00025623105466365814, -0.00023392587900161743, -0.00021162070333957672, -0.000189315527677536, -0.0001670103520154953, -0.0001447051763534546, -0.00012240000069141388, -0.00010009482502937317, -7.778964936733246e-05, -5.548447370529175e-05, -3.317929804325104e-05, -1.0874122381210327e-05, 1.1431053280830383e-05, 3.3736228942871094e-05, 5.6041404604911804e-05, 7.834658026695251e-05, 0.00010065175592899323, 0.00012295693159103394, 0.00014526210725307465, 0.00016756728291511536, 0.00018987245857715607, 0.00021217763423919678, 0.0002344828099012375, 0.0002567879855632782, 0.0002790931612253189, 0.0003013983368873596, 0.00032370351254940033, 0.00034600868821144104, 0.00036831386387348175, 0.00039061903953552246, 0.00041292421519756317, 0.0004352293908596039, 0.0004575345665216446, 0.0004798397421836853, 0.000502144917845726, 0.0005244500935077667, 0.0005467552691698074, 0.0005690604448318481, 0.0005913656204938889, 0.0006136707961559296, 0.0006359759718179703, 0.000658281147480011, 0.0006805863231420517, 0.0007028914988040924, 0.0007251966744661331, 0.0007475018501281738]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 10.0, 6.0, 11.0, 10.0, 15.0, 16.0, 17.0, 18.0, 31.0, 35.0, 43.0, 51.0, 44.0, 44.0, 61.0, 57.0, 51.0, 61.0, 47.0, 61.0, 53.0, 37.0, 41.0, 26.0, 32.0, 30.0, 17.0, 19.0, 9.0, 16.0, 10.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.2442626953125, -5.047119140625, -4.8499755859375, -4.65283203125, -4.4556884765625, -4.258544921875, -4.0614013671875, -3.8642578125, -3.6671142578125, -3.469970703125, -3.2728271484375, -3.07568359375, -2.8785400390625, -2.681396484375, -2.4842529296875, -2.287109375, -2.0899658203125, -1.892822265625, -1.6956787109375, -1.49853515625, -1.3013916015625, -1.104248046875, -0.9071044921875, -0.7099609375, -0.5128173828125, -0.315673828125, -0.1185302734375, 0.07861328125, 0.2757568359375, 0.472900390625, 0.6700439453125, 0.8671875, 1.0643310546875, 1.261474609375, 1.4586181640625, 1.65576171875, 1.8529052734375, 2.050048828125, 2.2471923828125, 2.4443359375, 2.6414794921875, 2.838623046875, 3.0357666015625, 3.23291015625, 3.4300537109375, 3.627197265625, 3.8243408203125, 4.021484375, 4.2186279296875, 4.415771484375, 4.6129150390625, 4.81005859375, 5.0072021484375, 5.204345703125, 5.4014892578125, 5.5986328125, 5.7957763671875, 5.992919921875, 6.1900634765625, 6.38720703125, 6.5843505859375, 6.781494140625, 6.9786376953125, 7.17578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 19.0, 15.0, 39.0, 37.0, 78.0, 129.0, 181.0, 348.0, 597.0, 1159.0, 2285.0, 4629.0, 9310.0, 18906.0, 38038.0, 76955.0, 156197.0, 272724.0, 230338.0, 119022.0, 59093.0, 29239.0, 14818.0, 7147.0, 3438.0, 1797.0, 822.0, 473.0, 262.0, 159.0, 97.0, 57.0, 46.0, 36.0, 20.0, 9.0, 14.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.01171875, -4.87176513671875, -4.7318115234375, -4.59185791015625, -4.451904296875, -4.31195068359375, -4.1719970703125, -4.03204345703125, -3.89208984375, -3.75213623046875, -3.6121826171875, -3.47222900390625, -3.332275390625, -3.19232177734375, -3.0523681640625, -2.91241455078125, -2.7724609375, -2.63250732421875, -2.4925537109375, -2.35260009765625, -2.212646484375, -2.07269287109375, -1.9327392578125, -1.79278564453125, -1.65283203125, -1.51287841796875, -1.3729248046875, -1.23297119140625, -1.093017578125, -0.95306396484375, -0.8131103515625, -0.67315673828125, -0.533203125, -0.39324951171875, -0.2532958984375, -0.11334228515625, 0.026611328125, 0.16656494140625, 0.3065185546875, 0.44647216796875, 0.58642578125, 0.72637939453125, 0.8663330078125, 1.00628662109375, 1.146240234375, 1.28619384765625, 1.4261474609375, 1.56610107421875, 1.7060546875, 1.84600830078125, 1.9859619140625, 2.12591552734375, 2.265869140625, 2.40582275390625, 2.5457763671875, 2.68572998046875, 2.82568359375, 2.96563720703125, 3.1055908203125, 3.24554443359375, 3.385498046875, 3.52545166015625, 3.6654052734375, 3.80535888671875, 3.9453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 7.0, 8.0, 10.0, 10.0, 11.0, 11.0, 23.0, 28.0, 25.0, 40.0, 36.0, 49.0, 56.0, 64.0, 76.0, 121.0, 243.0, 1464.0, 223.0, 127.0, 72.0, 61.0, 43.0, 41.0, 34.0, 26.0, 24.0, 20.0, 13.0, 17.0, 13.0, 8.0, 9.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.03125, -23.353515625, -22.67578125, -21.998046875, -21.3203125, -20.642578125, -19.96484375, -19.287109375, -18.609375, -17.931640625, -17.25390625, -16.576171875, -15.8984375, -15.220703125, -14.54296875, -13.865234375, -13.1875, -12.509765625, -11.83203125, -11.154296875, -10.4765625, -9.798828125, -9.12109375, -8.443359375, -7.765625, -7.087890625, -6.41015625, -5.732421875, -5.0546875, -4.376953125, -3.69921875, -3.021484375, -2.34375, -1.666015625, -0.98828125, -0.310546875, 0.3671875, 1.044921875, 1.72265625, 2.400390625, 3.078125, 3.755859375, 4.43359375, 5.111328125, 5.7890625, 6.466796875, 7.14453125, 7.822265625, 8.5, 9.177734375, 9.85546875, 10.533203125, 11.2109375, 11.888671875, 12.56640625, 13.244140625, 13.921875, 14.599609375, 15.27734375, 15.955078125, 16.6328125, 17.310546875, 17.98828125, 18.666015625, 19.34375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 12.0, 14.0, 16.0, 30.0, 31.0, 47.0, 83.0, 124.0, 193.0, 342.0, 748.0, 7220.0, 3118618.0, 16294.0, 932.0, 398.0, 212.0, 131.0, 82.0, 55.0, 33.0, 25.0, 19.0, 16.0, 10.0, 8.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -63.9375, -61.4375, -58.9375, -56.4375, -53.9375, -51.4375, -48.9375, -46.4375, -43.9375, -41.4375, -38.9375, -36.4375, -33.9375, -31.4375, -28.9375, -26.4375, -23.9375, -21.4375, -18.9375, -16.4375, -13.9375, -11.4375, -8.9375, -6.4375, -3.9375, -1.4375, 1.0625, 3.5625, 6.0625, 8.5625, 11.0625, 13.5625, 16.0625, 18.5625, 21.0625, 23.5625, 26.0625, 28.5625, 31.0625, 33.5625, 36.0625, 38.5625, 41.0625, 43.5625, 46.0625, 48.5625, 51.0625, 53.5625, 56.0625, 58.5625, 61.0625, 63.5625, 66.0625, 68.5625, 71.0625, 73.5625, 76.0625, 78.5625, 81.0625, 83.5625, 86.0625, 88.5625, 91.0625, 93.5625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 43.0, 200.0, 419.0, 278.0, 60.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.42967224121094, -149.29757690429688, -146.16549682617188, -143.0334014892578, -139.9013214111328, -136.76922607421875, -133.63714599609375, -130.5050506591797, -127.37297058105469, -124.24088287353516, -121.10879516601562, -117.9767074584961, -114.84461975097656, -111.71253204345703, -108.5804443359375, -105.44834899902344, -102.3162612915039, -99.18417358398438, -96.05208587646484, -92.91999816894531, -89.78791046142578, -86.65582275390625, -83.52372741699219, -80.39164733886719, -77.25955200195312, -74.1274642944336, -70.99537658691406, -67.86328887939453, -64.731201171875, -61.59911346435547, -58.46702194213867, -55.33493423461914, -52.20285415649414, -49.07076644897461, -45.93867874145508, -42.80658721923828, -39.67449951171875, -36.54241180419922, -33.41032409667969, -30.278236389160156, -27.146148681640625, -24.014060974121094, -20.881973266601562, -17.7498836517334, -14.617795944213867, -11.485708236694336, -8.353618621826172, -5.221530914306641, -2.0894432067871094, 1.04264497756958, 4.1747331619262695, 7.306821823120117, 10.438909530639648, 13.57099723815918, 16.703086853027344, 19.835174560546875, 22.967262268066406, 26.099349975585938, 29.23143768310547, 32.363525390625, 35.49561309814453, 38.62770080566406, 41.75979232788086, 44.89188003540039, 48.02396774291992]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 2.0, 7.0, 7.0, 13.0, 8.0, 11.0, 9.0, 13.0, 13.0, 22.0, 25.0, 18.0, 34.0, 21.0, 26.0, 19.0, 33.0, 32.0, 43.0, 32.0, 33.0, 32.0, 28.0, 40.0, 30.0, 41.0, 33.0, 41.0, 32.0, 30.0, 31.0, 22.0, 29.0, 23.0, 13.0, 20.0, 11.0, 21.0, 6.0, 6.0, 13.0, 10.0, 11.0, 9.0, 7.0, 7.0, 9.0, 3.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0], "bins": [-36.1612663269043, -34.994667053222656, -33.82807159423828, -32.66147232055664, -31.494876861572266, -30.328277587890625, -29.161680221557617, -27.99508285522461, -26.8284854888916, -25.661888122558594, -24.495290756225586, -23.328693389892578, -22.162094116210938, -20.995498657226562, -19.828899383544922, -18.662302017211914, -17.495704650878906, -16.3291072845459, -15.16250991821289, -13.995911598205566, -12.829314231872559, -11.66271686553955, -10.496118545532227, -9.329521179199219, -8.162923812866211, -6.996326446533203, -5.829728603363037, -4.663130760192871, -3.4965333938598633, -2.3299360275268555, -1.1633381843566895, 0.0032596588134765625, 1.1698570251464844, 2.3364546298980713, 3.503052234649658, 4.669650077819824, 5.836247444152832, 7.00284481048584, 8.169443130493164, 9.336040496826172, 10.50263786315918, 11.669235229492188, 12.835832595825195, 14.00243091583252, 15.169028282165527, 16.33562469482422, 17.50222396850586, 18.668821334838867, 19.835418701171875, 21.002016067504883, 22.16861343383789, 23.3352108001709, 24.501808166503906, 25.668407440185547, 26.835004806518555, 28.001602172851562, 29.16819953918457, 30.334796905517578, 31.501394271850586, 32.667991638183594, 33.834590911865234, 35.00118637084961, 36.16778564453125, 37.334381103515625, 38.500980377197266]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 11.0, 6.0, 9.0, 15.0, 12.0, 8.0, 23.0, 34.0, 22.0, 32.0, 34.0, 39.0, 49.0, 48.0, 55.0, 50.0, 58.0, 45.0, 59.0, 53.0, 56.0, 37.0, 38.0, 33.0, 32.0, 22.0, 24.0, 16.0, 16.0, 16.0, 9.0, 7.0, 13.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.3482666015625, -5.141845703125, -4.9354248046875, -4.72900390625, -4.5225830078125, -4.316162109375, -4.1097412109375, -3.9033203125, -3.6968994140625, -3.490478515625, -3.2840576171875, -3.07763671875, -2.8712158203125, -2.664794921875, -2.4583740234375, -2.251953125, -2.0455322265625, -1.839111328125, -1.6326904296875, -1.42626953125, -1.2198486328125, -1.013427734375, -0.8070068359375, -0.6005859375, -0.3941650390625, -0.187744140625, 0.0186767578125, 0.22509765625, 0.4315185546875, 0.637939453125, 0.8443603515625, 1.05078125, 1.2572021484375, 1.463623046875, 1.6700439453125, 1.87646484375, 2.0828857421875, 2.289306640625, 2.4957275390625, 2.7021484375, 2.9085693359375, 3.114990234375, 3.3214111328125, 3.52783203125, 3.7342529296875, 3.940673828125, 4.1470947265625, 4.353515625, 4.5599365234375, 4.766357421875, 4.9727783203125, 5.17919921875, 5.3856201171875, 5.592041015625, 5.7984619140625, 6.0048828125, 6.2113037109375, 6.417724609375, 6.6241455078125, 6.83056640625, 7.0369873046875, 7.243408203125, 7.4498291015625, 7.65625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 11.0, 6.0, 6.0, 10.0, 5.0, 10.0, 15.0, 15.0, 25.0, 22.0, 30.0, 27.0, 46.0, 69.0, 147.0, 377.0, 2019.0, 40141.0, 1761877.0, 2325088.0, 60943.0, 2506.0, 427.0, 146.0, 75.0, 49.0, 36.0, 18.0, 26.0, 22.0, 19.0, 19.0, 15.0, 7.0, 5.0, 9.0, 8.0, 3.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.96875, -17.3046875, -16.640625, -15.9765625, -15.3125, -14.6484375, -13.984375, -13.3203125, -12.65625, -11.9921875, -11.328125, -10.6640625, -10.0, -9.3359375, -8.671875, -8.0078125, -7.34375, -6.6796875, -6.015625, -5.3515625, -4.6875, -4.0234375, -3.359375, -2.6953125, -2.03125, -1.3671875, -0.703125, -0.0390625, 0.625, 1.2890625, 1.953125, 2.6171875, 3.28125, 3.9453125, 4.609375, 5.2734375, 5.9375, 6.6015625, 7.265625, 7.9296875, 8.59375, 9.2578125, 9.921875, 10.5859375, 11.25, 11.9140625, 12.578125, 13.2421875, 13.90625, 14.5703125, 15.234375, 15.8984375, 16.5625, 17.2265625, 17.890625, 18.5546875, 19.21875, 19.8828125, 20.546875, 21.2109375, 21.875, 22.5390625, 23.203125, 23.8671875, 24.53125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 11.0, 19.0, 16.0, 24.0, 37.0, 43.0, 47.0, 98.0, 114.0, 169.0, 216.0, 262.0, 351.0, 412.0, 439.0, 399.0, 335.0, 258.0, 197.0, 169.0, 120.0, 89.0, 52.0, 54.0, 32.0, 20.0, 20.0, 12.0, 11.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.140625, -10.78564453125, -10.4306640625, -10.07568359375, -9.720703125, -9.36572265625, -9.0107421875, -8.65576171875, -8.30078125, -7.94580078125, -7.5908203125, -7.23583984375, -6.880859375, -6.52587890625, -6.1708984375, -5.81591796875, -5.4609375, -5.10595703125, -4.7509765625, -4.39599609375, -4.041015625, -3.68603515625, -3.3310546875, -2.97607421875, -2.62109375, -2.26611328125, -1.9111328125, -1.55615234375, -1.201171875, -0.84619140625, -0.4912109375, -0.13623046875, 0.21875, 0.57373046875, 0.9287109375, 1.28369140625, 1.638671875, 1.99365234375, 2.3486328125, 2.70361328125, 3.05859375, 3.41357421875, 3.7685546875, 4.12353515625, 4.478515625, 4.83349609375, 5.1884765625, 5.54345703125, 5.8984375, 6.25341796875, 6.6083984375, 6.96337890625, 7.318359375, 7.67333984375, 8.0283203125, 8.38330078125, 8.73828125, 9.09326171875, 9.4482421875, 9.80322265625, 10.158203125, 10.51318359375, 10.8681640625, 11.22314453125, 11.578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 11.0, 18.0, 14.0, 28.0, 33.0, 48.0, 60.0, 89.0, 129.0, 203.0, 315.0, 503.0, 1567.0, 16376.0, 624180.0, 3353531.0, 188394.0, 6572.0, 957.0, 407.0, 242.0, 175.0, 101.0, 95.0, 61.0, 43.0, 37.0, 23.0, 18.0, 9.0, 8.0, 9.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.578125, -26.6982421875, -25.818359375, -24.9384765625, -24.05859375, -23.1787109375, -22.298828125, -21.4189453125, -20.5390625, -19.6591796875, -18.779296875, -17.8994140625, -17.01953125, -16.1396484375, -15.259765625, -14.3798828125, -13.5, -12.6201171875, -11.740234375, -10.8603515625, -9.98046875, -9.1005859375, -8.220703125, -7.3408203125, -6.4609375, -5.5810546875, -4.701171875, -3.8212890625, -2.94140625, -2.0615234375, -1.181640625, -0.3017578125, 0.578125, 1.4580078125, 2.337890625, 3.2177734375, 4.09765625, 4.9775390625, 5.857421875, 6.7373046875, 7.6171875, 8.4970703125, 9.376953125, 10.2568359375, 11.13671875, 12.0166015625, 12.896484375, 13.7763671875, 14.65625, 15.5361328125, 16.416015625, 17.2958984375, 18.17578125, 19.0556640625, 19.935546875, 20.8154296875, 21.6953125, 22.5751953125, 23.455078125, 24.3349609375, 25.21484375, 26.0947265625, 26.974609375, 27.8544921875, 28.734375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 17.0, 45.0, 72.0, 140.0, 206.0, 231.0, 146.0, 80.0, 45.0, 20.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.32610321044922, -116.27906036376953, -113.23200988769531, -110.18496704101562, -107.13792419433594, -104.09087371826172, -101.04383087158203, -97.99678039550781, -94.94973754882812, -91.90269470214844, -88.85564422607422, -85.80860137939453, -82.76155090332031, -79.71450805664062, -76.66746520996094, -73.62042236328125, -70.57337188720703, -67.52632904052734, -64.47927856445312, -61.43223571777344, -58.385189056396484, -55.33814239501953, -52.291099548339844, -49.24405288696289, -46.19700622558594, -43.149959564208984, -40.10291290283203, -37.055870056152344, -34.00882339477539, -30.961776733398438, -27.914731979370117, -24.867687225341797, -21.820648193359375, -18.773601531982422, -15.726556777954102, -12.679511070251465, -9.632465362548828, -6.585419654846191, -3.5383739471435547, -0.4913291931152344, 2.5557174682617188, 5.6027631759643555, 8.649808883666992, 11.696854591369629, 14.743900299072266, 17.79094696044922, 20.83799171447754, 23.88503646850586, 26.932083129882812, 29.979129791259766, 33.02617645263672, 36.073219299316406, 39.12026596069336, 42.16731262207031, 45.21435546875, 48.26140213012695, 51.308448791503906, 54.35549545288086, 57.40254211425781, 60.4495849609375, 63.49663162231445, 66.5436782836914, 69.5907211303711, 72.63777160644531, 75.684814453125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 8.0, 6.0, 13.0, 8.0, 12.0, 13.0, 16.0, 19.0, 30.0, 18.0, 26.0, 32.0, 40.0, 38.0, 36.0, 33.0, 48.0, 41.0, 27.0, 27.0, 47.0, 42.0, 40.0, 26.0, 50.0, 44.0, 31.0, 33.0, 24.0, 16.0, 28.0, 22.0, 12.0, 17.0, 12.0, 8.0, 12.0, 8.0, 7.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.032493591308594, -29.87095069885254, -28.709407806396484, -27.547866821289062, -26.386323928833008, -25.224781036376953, -24.0632381439209, -22.901695251464844, -21.740154266357422, -20.578611373901367, -19.417068481445312, -18.25552749633789, -17.093984603881836, -15.932441711425781, -14.770898818969727, -13.609356880187988, -12.447813034057617, -11.286270141601562, -10.124728202819824, -8.96318531036377, -7.801642894744873, -6.640100479125977, -5.478557586669922, -4.317015647888184, -3.155472755432129, -1.9939302206039429, -0.8323876857757568, 0.32915496826171875, 1.4906973838806152, 2.6522397994995117, 3.8137826919555664, 4.975324630737305, 6.136867523193359, 7.298409938812256, 8.459952354431152, 9.621495246887207, 10.783037185668945, 11.944580078125, 13.106122970581055, 14.267664909362793, 15.429207801818848, 16.590749740600586, 17.75229263305664, 18.913835525512695, 20.07537841796875, 21.236919403076172, 22.39846420288086, 23.56000518798828, 24.721548080444336, 25.88309097290039, 27.044633865356445, 28.2061767578125, 29.367717742919922, 30.529260635375977, 31.69080352783203, 32.85234451293945, 34.01388931274414, 35.17543029785156, 36.33697509765625, 37.49851608276367, 38.66006088256836, 39.82160186767578, 40.98314666748047, 42.14468765258789, 43.30622863769531]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 10.0, 10.0, 17.0, 23.0, 22.0, 23.0, 22.0, 40.0, 49.0, 34.0, 45.0, 53.0, 53.0, 62.0, 38.0, 50.0, 55.0, 51.0, 41.0, 49.0, 43.0, 37.0, 26.0, 23.0, 20.0, 16.0, 21.0, 13.0, 16.0, 9.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.19635009765625, -4.9942626953125, -4.79217529296875, -4.590087890625, -4.38800048828125, -4.1859130859375, -3.98382568359375, -3.78173828125, -3.57965087890625, -3.3775634765625, -3.17547607421875, -2.973388671875, -2.77130126953125, -2.5692138671875, -2.36712646484375, -2.1650390625, -1.96295166015625, -1.7608642578125, -1.55877685546875, -1.356689453125, -1.15460205078125, -0.9525146484375, -0.75042724609375, -0.54833984375, -0.34625244140625, -0.1441650390625, 0.05792236328125, 0.260009765625, 0.46209716796875, 0.6641845703125, 0.86627197265625, 1.068359375, 1.27044677734375, 1.4725341796875, 1.67462158203125, 1.876708984375, 2.07879638671875, 2.2808837890625, 2.48297119140625, 2.68505859375, 2.88714599609375, 3.0892333984375, 3.29132080078125, 3.493408203125, 3.69549560546875, 3.8975830078125, 4.09967041015625, 4.3017578125, 4.50384521484375, 4.7059326171875, 4.90802001953125, 5.110107421875, 5.31219482421875, 5.5142822265625, 5.71636962890625, 5.91845703125, 6.12054443359375, 6.3226318359375, 6.52471923828125, 6.726806640625, 6.92889404296875, 7.1309814453125, 7.33306884765625, 7.53515625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 6.0, 4.0, 12.0, 16.0, 23.0, 27.0, 49.0, 75.0, 107.0, 190.0, 289.0, 432.0, 610.0, 983.0, 1531.0, 2238.0, 3490.0, 4872.0, 7490.0, 11368.0, 16852.0, 25797.0, 39578.0, 61426.0, 95631.0, 147396.0, 189593.0, 153337.0, 100035.0, 63772.0, 41387.0, 26777.0, 17890.0, 11686.0, 7831.0, 5283.0, 3629.0, 2390.0, 1632.0, 1004.0, 617.0, 425.0, 277.0, 194.0, 115.0, 82.0, 52.0, 31.0, 10.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3732795715332031, -0.36106109619140625, -0.3488426208496094, -0.3366241455078125, -0.3244056701660156, -0.31218719482421875, -0.2999687194824219, -0.287750244140625, -0.2755317687988281, -0.26331329345703125, -0.2510948181152344, -0.2388763427734375, -0.22665786743164062, -0.21443939208984375, -0.20222091674804688, -0.19000244140625, -0.17778396606445312, -0.16556549072265625, -0.15334701538085938, -0.1411285400390625, -0.12891006469726562, -0.11669158935546875, -0.10447311401367188, -0.092254638671875, -0.08003616333007812, -0.06781768798828125, -0.055599212646484375, -0.0433807373046875, -0.031162261962890625, -0.01894378662109375, -0.006725311279296875, 0.0054931640625, 0.017711639404296875, 0.02993011474609375, 0.042148590087890625, 0.0543670654296875, 0.06658554077148438, 0.07880401611328125, 0.09102249145507812, 0.103240966796875, 0.11545944213867188, 0.12767791748046875, 0.13989639282226562, 0.1521148681640625, 0.16433334350585938, 0.17655181884765625, 0.18877029418945312, 0.20098876953125, 0.21320724487304688, 0.22542572021484375, 0.23764419555664062, 0.2498626708984375, 0.2620811462402344, 0.27429962158203125, 0.2865180969238281, 0.298736572265625, 0.3109550476074219, 0.32317352294921875, 0.3353919982910156, 0.3476104736328125, 0.3598289489746094, 0.37204742431640625, 0.3842658996582031, 0.396484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 8.0, 11.0, 8.0, 14.0, 16.0, 17.0, 20.0, 21.0, 29.0, 30.0, 28.0, 27.0, 30.0, 28.0, 32.0, 39.0, 34.0, 40.0, 1070.0, 33.0, 52.0, 37.0, 38.0, 32.0, 36.0, 31.0, 40.0, 37.0, 22.0, 21.0, 19.0, 31.0, 16.0, 7.0, 11.0, 7.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.162109375, -3.0589599609375, -2.955810546875, -2.8526611328125, -2.74951171875, -2.6463623046875, -2.543212890625, -2.4400634765625, -2.3369140625, -2.2337646484375, -2.130615234375, -2.0274658203125, -1.92431640625, -1.8211669921875, -1.718017578125, -1.6148681640625, -1.51171875, -1.4085693359375, -1.305419921875, -1.2022705078125, -1.09912109375, -0.9959716796875, -0.892822265625, -0.7896728515625, -0.6865234375, -0.5833740234375, -0.480224609375, -0.3770751953125, -0.27392578125, -0.1707763671875, -0.067626953125, 0.0355224609375, 0.138671875, 0.2418212890625, 0.344970703125, 0.4481201171875, 0.55126953125, 0.6544189453125, 0.757568359375, 0.8607177734375, 0.9638671875, 1.0670166015625, 1.170166015625, 1.2733154296875, 1.37646484375, 1.4796142578125, 1.582763671875, 1.6859130859375, 1.7890625, 1.8922119140625, 1.995361328125, 2.0985107421875, 2.20166015625, 2.3048095703125, 2.407958984375, 2.5111083984375, 2.6142578125, 2.7174072265625, 2.820556640625, 2.9237060546875, 3.02685546875, 3.1300048828125, 3.233154296875, 3.3363037109375, 3.439453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 10.0, 7.0, 12.0, 26.0, 36.0, 57.0, 62.0, 96.0, 150.0, 234.0, 333.0, 446.0, 734.0, 1195.0, 1797.0, 2792.0, 4224.0, 6683.0, 10502.0, 16838.0, 26446.0, 41941.0, 66105.0, 103386.0, 153481.0, 1232142.0, 150657.0, 100715.0, 64177.0, 40870.0, 25854.0, 16321.0, 10293.0, 6629.0, 4197.0, 2704.0, 1717.0, 1150.0, 690.0, 458.0, 310.0, 220.0, 159.0, 107.0, 55.0, 35.0, 25.0, 20.0, 11.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.34375, -0.3331642150878906, -0.32257843017578125, -0.3119926452636719, -0.3014068603515625, -0.2908210754394531, -0.28023529052734375, -0.2696495056152344, -0.259063720703125, -0.24847793579101562, -0.23789215087890625, -0.22730636596679688, -0.2167205810546875, -0.20613479614257812, -0.19554901123046875, -0.18496322631835938, -0.17437744140625, -0.16379165649414062, -0.15320587158203125, -0.14262008666992188, -0.1320343017578125, -0.12144851684570312, -0.11086273193359375, -0.10027694702148438, -0.089691162109375, -0.07910537719726562, -0.06851959228515625, -0.057933807373046875, -0.0473480224609375, -0.036762237548828125, -0.02617645263671875, -0.015590667724609375, -0.0050048828125, 0.005580902099609375, 0.01616668701171875, 0.026752471923828125, 0.0373382568359375, 0.047924041748046875, 0.05850982666015625, 0.06909561157226562, 0.079681396484375, 0.09026718139648438, 0.10085296630859375, 0.11143875122070312, 0.1220245361328125, 0.13261032104492188, 0.14319610595703125, 0.15378189086914062, 0.16436767578125, 0.17495346069335938, 0.18553924560546875, 0.19612503051757812, 0.2067108154296875, 0.21729660034179688, 0.22788238525390625, 0.23846817016601562, 0.249053955078125, 0.2596397399902344, 0.27022552490234375, 0.2808113098144531, 0.2913970947265625, 0.3019828796386719, 0.31256866455078125, 0.3231544494628906, 0.333740234375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 5.0, 7.0, 20.0, 21.0, 16.0, 23.0, 36.0, 47.0, 57.0, 55.0, 59.0, 75.0, 70.0, 59.0, 66.0, 57.0, 54.0, 52.0, 48.0, 34.0, 27.0, 20.0, 24.0, 14.0, 12.0, 5.0, 5.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011997222900390625, -0.0011571943759918213, -0.00111466646194458, -0.0010721385478973389, -0.0010296106338500977, -0.0009870827198028564, -0.0009445548057556152, -0.000902026891708374, -0.0008594989776611328, -0.0008169710636138916, -0.0007744431495666504, -0.0007319152355194092, -0.000689387321472168, -0.0006468594074249268, -0.0006043314933776855, -0.0005618035793304443, -0.0005192756652832031, -0.0004767477512359619, -0.0004342198371887207, -0.0003916919231414795, -0.0003491640090942383, -0.00030663609504699707, -0.00026410818099975586, -0.00022158026695251465, -0.00017905235290527344, -0.00013652443885803223, -9.399652481079102e-05, -5.1468610763549805e-05, -8.940696716308594e-06, 3.358721733093262e-05, 7.611513137817383e-05, 0.00011864304542541504, 0.00016117095947265625, 0.00020369887351989746, 0.00024622678756713867, 0.0002887547016143799, 0.0003312826156616211, 0.0003738105297088623, 0.0004163384437561035, 0.0004588663578033447, 0.0005013942718505859, 0.0005439221858978271, 0.0005864500999450684, 0.0006289780139923096, 0.0006715059280395508, 0.000714033842086792, 0.0007565617561340332, 0.0007990896701812744, 0.0008416175842285156, 0.0008841454982757568, 0.000926673412322998, 0.0009692013263702393, 0.0010117292404174805, 0.0010542571544647217, 0.0010967850685119629, 0.001139312982559204, 0.0011818408966064453, 0.0012243688106536865, 0.0012668967247009277, 0.001309424638748169, 0.0013519525527954102, 0.0013944804668426514, 0.0014370083808898926, 0.0014795362949371338, 0.001522064208984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 9.0, 5.0, 15.0, 17.0, 35.0, 30.0, 43.0, 66.0, 100.0, 175.0, 335.0, 812.0, 19305.0, 1018849.0, 7211.0, 758.0, 274.0, 144.0, 116.0, 75.0, 40.0, 30.0, 33.0, 15.0, 18.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.031890869140625, -0.0309906005859375, -0.03009033203125, -0.0291900634765625, -0.028289794921875, -0.0273895263671875, -0.0264892578125, -0.0255889892578125, -0.024688720703125, -0.0237884521484375, -0.02288818359375, -0.0219879150390625, -0.021087646484375, -0.0201873779296875, -0.019287109375, -0.0183868408203125, -0.017486572265625, -0.0165863037109375, -0.01568603515625, -0.0147857666015625, -0.013885498046875, -0.0129852294921875, -0.0120849609375, -0.0111846923828125, -0.010284423828125, -0.0093841552734375, -0.00848388671875, -0.0075836181640625, -0.006683349609375, -0.0057830810546875, -0.0048828125, -0.0039825439453125, -0.003082275390625, -0.0021820068359375, -0.00128173828125, -0.0003814697265625, 0.000518798828125, 0.0014190673828125, 0.0023193359375, 0.0032196044921875, 0.004119873046875, 0.0050201416015625, 0.00592041015625, 0.0068206787109375, 0.007720947265625, 0.0086212158203125, 0.009521484375, 0.0104217529296875, 0.011322021484375, 0.0122222900390625, 0.01312255859375, 0.0140228271484375, 0.014923095703125, 0.0158233642578125, 0.0167236328125, 0.0176239013671875, 0.018524169921875, 0.0194244384765625, 0.02032470703125, 0.0212249755859375, 0.022125244140625, 0.0230255126953125, 0.02392578125, 0.0248260498046875, 0.025726318359375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 12.0, 19.0, 54.0, 90.0, 120.0, 189.0, 155.0, 153.0, 109.0, 55.0, 22.0, 12.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015501226298511028, -0.0015071295201778412, -0.0014641364105045795, -0.001421143300831318, -0.0013781501911580563, -0.0013351570814847946, -0.001292163971811533, -0.0012491707457229495, -0.0012061776360496879, -0.0011631845263764262, -0.0011201914167031646, -0.001077198307029903, -0.0010342051973566413, -0.0009912119712680578, -0.0009482189198024571, -0.0009052257519215345, -0.0008622327004559338, -0.0008192395907826722, -0.0007762464811094105, -0.000733253313228488, -0.0006902602035552263, -0.0006472670938819647, -0.000604273984208703, -0.0005612808745354414, -0.0005182877648621798, -0.0004752946551889181, -0.000432301516411826, -0.00038930840673856437, -0.00034631526796147227, -0.00030332215828821063, -0.000260329048614949, -0.0002173359098378569, -0.0001743427710607648, -0.00013134964683558792, -8.835652988636866e-05, -4.5363412937149405e-05, -2.3702887119725347e-06, 4.0622835513204336e-05, 8.361594518646598e-05, 0.00012660908396355808, 0.00016960219363681972, 0.0002125953178619966, 0.00025558844208717346, 0.0002985815517604351, 0.00034157466143369675, 0.00038456780021078885, 0.0004275609098840505, 0.0004705540486611426, 0.0005135471583344042, 0.0005565402680076659, 0.0005995333776809275, 0.0006425265455618501, 0.0006855196552351117, 0.0007285127649083734, 0.000771505874581635, 0.0008144989842548966, 0.0008574920939281583, 0.0009004852036014199, 0.0009434783132746816, 0.0009864714229479432, 0.0010294645326212049, 0.0010724577587097883, 0.00111545086838305, 0.0011584439780563116, 0.0012014370877295732]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 7.0, 3.0, 11.0, 7.0, 12.0, 8.0, 14.0, 11.0, 21.0, 19.0, 24.0, 29.0, 27.0, 27.0, 41.0, 28.0, 41.0, 48.0, 32.0, 36.0, 33.0, 46.0, 31.0, 49.0, 41.0, 37.0, 31.0, 39.0, 22.0, 29.0, 28.0, 20.0, 27.0, 25.0, 20.0, 13.0, 16.0, 4.0, 8.0, 11.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005868673324584961, -0.000568232499063015, -0.0005495976656675339, -0.0005309628322720528, -0.0005123279988765717, -0.0004936931654810905, -0.00047505833208560944, -0.0004564234986901283, -0.0004377886652946472, -0.0004191538318991661, -0.000400518998503685, -0.0003818841651082039, -0.0003632493317127228, -0.00034461449831724167, -0.00032597966492176056, -0.00030734483152627945, -0.00028870999813079834, -0.00027007516473531723, -0.0002514403313398361, -0.000232805497944355, -0.0002141706645488739, -0.0001955358311533928, -0.00017690099775791168, -0.00015826616436243057, -0.00013963133096694946, -0.00012099649757146835, -0.00010236166417598724, -8.372683078050613e-05, -6.509199738502502e-05, -4.6457163989543915e-05, -2.7822330594062805e-05, -9.187497198581696e-06, 9.447336196899414e-06, 2.8082169592380524e-05, 4.671700298786163e-05, 6.535183638334274e-05, 8.398666977882385e-05, 0.00010262150317430496, 0.00012125633656978607, 0.00013989116996526718, 0.0001585260033607483, 0.0001771608367562294, 0.0001957956701517105, 0.00021443050354719162, 0.00023306533694267273, 0.00025170017033815384, 0.00027033500373363495, 0.00028896983712911606, 0.00030760467052459717, 0.0003262395039200783, 0.0003448743373155594, 0.0003635091707110405, 0.0003821440041065216, 0.0004007788375020027, 0.0004194136708974838, 0.00043804850429296494, 0.00045668333768844604, 0.00047531817108392715, 0.0004939530044794083, 0.0005125878378748894, 0.0005312226712703705, 0.0005498575046658516, 0.0005684923380613327, 0.0005871271714568138, 0.0006057620048522949]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 10.0, 10.0, 17.0, 23.0, 22.0, 23.0, 22.0, 40.0, 49.0, 34.0, 45.0, 52.0, 54.0, 62.0, 38.0, 50.0, 55.0, 51.0, 41.0, 49.0, 43.0, 37.0, 26.0, 23.0, 20.0, 16.0, 21.0, 13.0, 16.0, 9.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.19635009765625, -4.9942626953125, -4.79217529296875, -4.590087890625, -4.38800048828125, -4.1859130859375, -3.98382568359375, -3.78173828125, -3.57965087890625, -3.3775634765625, -3.17547607421875, -2.973388671875, -2.77130126953125, -2.5692138671875, -2.36712646484375, -2.1650390625, -1.96295166015625, -1.7608642578125, -1.55877685546875, -1.356689453125, -1.15460205078125, -0.9525146484375, -0.75042724609375, -0.54833984375, -0.34625244140625, -0.1441650390625, 0.05792236328125, 0.260009765625, 0.46209716796875, 0.6641845703125, 0.86627197265625, 1.068359375, 1.27044677734375, 1.4725341796875, 1.67462158203125, 1.876708984375, 2.07879638671875, 2.2808837890625, 2.48297119140625, 2.68505859375, 2.88714599609375, 3.0892333984375, 3.29132080078125, 3.493408203125, 3.69549560546875, 3.8975830078125, 4.09967041015625, 4.3017578125, 4.50384521484375, 4.7059326171875, 4.90802001953125, 5.110107421875, 5.31219482421875, 5.5142822265625, 5.71636962890625, 5.91845703125, 6.12054443359375, 6.3226318359375, 6.52471923828125, 6.726806640625, 6.92889404296875, 7.1309814453125, 7.33306884765625, 7.53515625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 12.0, 10.0, 16.0, 20.0, 19.0, 39.0, 47.0, 81.0, 123.0, 232.0, 339.0, 632.0, 1290.0, 2653.0, 5845.0, 12352.0, 25966.0, 52539.0, 105078.0, 215558.0, 309392.0, 161488.0, 78577.0, 39557.0, 19122.0, 9159.0, 4201.0, 1960.0, 960.0, 488.0, 287.0, 152.0, 118.0, 64.0, 51.0, 23.0, 27.0, 21.0, 9.0, 4.0, 10.0, 5.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.85546875, -4.7003173828125, -4.545166015625, -4.3900146484375, -4.23486328125, -4.0797119140625, -3.924560546875, -3.7694091796875, -3.6142578125, -3.4591064453125, -3.303955078125, -3.1488037109375, -2.99365234375, -2.8385009765625, -2.683349609375, -2.5281982421875, -2.373046875, -2.2178955078125, -2.062744140625, -1.9075927734375, -1.75244140625, -1.5972900390625, -1.442138671875, -1.2869873046875, -1.1318359375, -0.9766845703125, -0.821533203125, -0.6663818359375, -0.51123046875, -0.3560791015625, -0.200927734375, -0.0457763671875, 0.109375, 0.2645263671875, 0.419677734375, 0.5748291015625, 0.72998046875, 0.8851318359375, 1.040283203125, 1.1954345703125, 1.3505859375, 1.5057373046875, 1.660888671875, 1.8160400390625, 1.97119140625, 2.1263427734375, 2.281494140625, 2.4366455078125, 2.591796875, 2.7469482421875, 2.902099609375, 3.0572509765625, 3.21240234375, 3.3675537109375, 3.522705078125, 3.6778564453125, 3.8330078125, 3.9881591796875, 4.143310546875, 4.2984619140625, 4.45361328125, 4.6087646484375, 4.763916015625, 4.9190673828125, 5.07421875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 6.0, 5.0, 3.0, 5.0, 7.0, 17.0, 12.0, 10.0, 23.0, 12.0, 13.0, 13.0, 21.0, 26.0, 31.0, 32.0, 27.0, 33.0, 38.0, 46.0, 65.0, 141.0, 314.0, 1400.0, 213.0, 84.0, 69.0, 49.0, 38.0, 30.0, 28.0, 18.0, 20.0, 24.0, 27.0, 24.0, 26.0, 18.0, 15.0, 13.0, 13.0, 7.0, 8.0, 5.0, 4.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-16.015625, -15.517822265625, -15.02001953125, -14.522216796875, -14.0244140625, -13.526611328125, -13.02880859375, -12.531005859375, -12.033203125, -11.535400390625, -11.03759765625, -10.539794921875, -10.0419921875, -9.544189453125, -9.04638671875, -8.548583984375, -8.05078125, -7.552978515625, -7.05517578125, -6.557373046875, -6.0595703125, -5.561767578125, -5.06396484375, -4.566162109375, -4.068359375, -3.570556640625, -3.07275390625, -2.574951171875, -2.0771484375, -1.579345703125, -1.08154296875, -0.583740234375, -0.0859375, 0.411865234375, 0.90966796875, 1.407470703125, 1.9052734375, 2.403076171875, 2.90087890625, 3.398681640625, 3.896484375, 4.394287109375, 4.89208984375, 5.389892578125, 5.8876953125, 6.385498046875, 6.88330078125, 7.381103515625, 7.87890625, 8.376708984375, 8.87451171875, 9.372314453125, 9.8701171875, 10.367919921875, 10.86572265625, 11.363525390625, 11.861328125, 12.359130859375, 12.85693359375, 13.354736328125, 13.8525390625, 14.350341796875, 14.84814453125, 15.345947265625, 15.84375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 10.0, 3.0, 9.0, 8.0, 24.0, 23.0, 25.0, 39.0, 51.0, 68.0, 94.0, 137.0, 163.0, 289.0, 550.0, 2160.0, 1708812.0, 1429722.0, 2092.0, 543.0, 273.0, 175.0, 113.0, 68.0, 57.0, 53.0, 36.0, 27.0, 18.0, 13.0, 16.0, 8.0, 5.0, 7.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.8125, -44.861328125, -42.91015625, -40.958984375, -39.0078125, -37.056640625, -35.10546875, -33.154296875, -31.203125, -29.251953125, -27.30078125, -25.349609375, -23.3984375, -21.447265625, -19.49609375, -17.544921875, -15.59375, -13.642578125, -11.69140625, -9.740234375, -7.7890625, -5.837890625, -3.88671875, -1.935546875, 0.015625, 1.966796875, 3.91796875, 5.869140625, 7.8203125, 9.771484375, 11.72265625, 13.673828125, 15.625, 17.576171875, 19.52734375, 21.478515625, 23.4296875, 25.380859375, 27.33203125, 29.283203125, 31.234375, 33.185546875, 35.13671875, 37.087890625, 39.0390625, 40.990234375, 42.94140625, 44.892578125, 46.84375, 48.794921875, 50.74609375, 52.697265625, 54.6484375, 56.599609375, 58.55078125, 60.501953125, 62.453125, 64.404296875, 66.35546875, 68.306640625, 70.2578125, 72.208984375, 74.16015625, 76.111328125, 78.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 99.0, 563.0, 328.0, 22.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.1383972167969, -261.0935363769531, -256.04864501953125, -251.00376892089844, -245.95889282226562, -240.9140167236328, -235.869140625, -230.82427978515625, -225.77938842773438, -220.73451232910156, -215.68963623046875, -210.64476013183594, -205.59988403320312, -200.5550079345703, -195.5101318359375, -190.46527099609375, -185.42039489746094, -180.37551879882812, -175.3306427001953, -170.2857666015625, -165.2408905029297, -160.19601440429688, -155.15113830566406, -150.10626220703125, -145.0614013671875, -140.0165252685547, -134.97164916992188, -129.92677307128906, -124.88189697265625, -119.83702087402344, -114.79215240478516, -109.74727630615234, -104.70240020751953, -99.65752410888672, -94.6126480102539, -89.5677719116211, -84.52290344238281, -79.47802734375, -74.43315124511719, -69.38827514648438, -64.34339904785156, -59.29852294921875, -54.25364685058594, -49.20877456665039, -44.16389846801758, -39.119022369384766, -34.07415008544922, -29.029273986816406, -23.984397888183594, -18.93952178955078, -13.894647598266602, -8.849772453308105, -3.8048973083496094, 1.2399787902832031, 6.284852981567383, 11.329727172851562, 16.374603271484375, 21.419479370117188, 26.464353561401367, 31.509227752685547, 36.55410385131836, 41.59897994995117, 46.64385223388672, 51.68872833251953, 56.733604431152344]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 5.0, 11.0, 9.0, 11.0, 17.0, 13.0, 19.0, 16.0, 18.0, 22.0, 19.0, 23.0, 26.0, 34.0, 39.0, 53.0, 39.0, 35.0, 47.0, 36.0, 38.0, 36.0, 39.0, 53.0, 48.0, 23.0, 41.0, 31.0, 20.0, 19.0, 19.0, 25.0, 17.0, 14.0, 13.0, 11.0, 13.0, 8.0, 7.0, 3.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.213050842285156, -51.61225891113281, -50.01146697998047, -48.41067886352539, -46.80988693237305, -45.2090950012207, -43.608306884765625, -42.00751495361328, -40.40672302246094, -38.805931091308594, -37.20513916015625, -35.60435104370117, -34.00355911254883, -32.402767181396484, -30.801977157592773, -29.201187133789062, -27.60039520263672, -25.999603271484375, -24.398813247680664, -22.798023223876953, -21.19723129272461, -19.596439361572266, -17.995649337768555, -16.394859313964844, -14.7940673828125, -13.193276405334473, -11.592485427856445, -9.991694450378418, -8.39090347290039, -6.790112495422363, -5.189321517944336, -3.5885305404663086, -1.9877395629882812, -0.3869485855102539, 1.2138423919677734, 2.814633369445801, 4.415424346923828, 6.0162153244018555, 7.617006301879883, 9.21779727935791, 10.818588256835938, 12.419379234313965, 14.020170211791992, 15.62096118927002, 17.221752166748047, 18.82254409790039, 20.4233341217041, 22.024124145507812, 23.624916076660156, 25.2257080078125, 26.82649803161621, 28.427288055419922, 30.028079986572266, 31.62887191772461, 33.22966003417969, 34.83045196533203, 36.431243896484375, 38.03203582763672, 39.63282775878906, 41.23361587524414, 42.834407806396484, 44.43519973754883, 46.035987854003906, 47.63677978515625, 49.237571716308594]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 8.0, 11.0, 14.0, 17.0, 17.0, 15.0, 26.0, 30.0, 28.0, 24.0, 40.0, 43.0, 43.0, 44.0, 42.0, 46.0, 58.0, 40.0, 46.0, 63.0, 47.0, 45.0, 33.0, 37.0, 31.0, 19.0, 20.0, 23.0, 21.0, 14.0, 14.0, 13.0, 7.0, 8.0, 4.0, 7.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.75830078125, -5.5439453125, -5.32958984375, -5.115234375, -4.90087890625, -4.6865234375, -4.47216796875, -4.2578125, -4.04345703125, -3.8291015625, -3.61474609375, -3.400390625, -3.18603515625, -2.9716796875, -2.75732421875, -2.54296875, -2.32861328125, -2.1142578125, -1.89990234375, -1.685546875, -1.47119140625, -1.2568359375, -1.04248046875, -0.828125, -0.61376953125, -0.3994140625, -0.18505859375, 0.029296875, 0.24365234375, 0.4580078125, 0.67236328125, 0.88671875, 1.10107421875, 1.3154296875, 1.52978515625, 1.744140625, 1.95849609375, 2.1728515625, 2.38720703125, 2.6015625, 2.81591796875, 3.0302734375, 3.24462890625, 3.458984375, 3.67333984375, 3.8876953125, 4.10205078125, 4.31640625, 4.53076171875, 4.7451171875, 4.95947265625, 5.173828125, 5.38818359375, 5.6025390625, 5.81689453125, 6.03125, 6.24560546875, 6.4599609375, 6.67431640625, 6.888671875, 7.10302734375, 7.3173828125, 7.53173828125, 7.74609375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 3.0, 5.0, 8.0, 11.0, 15.0, 13.0, 17.0, 31.0, 29.0, 35.0, 53.0, 47.0, 105.0, 241.0, 580.0, 2709.0, 46087.0, 1527712.0, 2497631.0, 112881.0, 4543.0, 860.0, 264.0, 122.0, 61.0, 52.0, 18.0, 28.0, 23.0, 21.0, 16.0, 11.0, 11.0, 10.0, 8.0, 9.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.90625, -17.26953125, -16.6328125, -15.99609375, -15.359375, -14.72265625, -14.0859375, -13.44921875, -12.8125, -12.17578125, -11.5390625, -10.90234375, -10.265625, -9.62890625, -8.9921875, -8.35546875, -7.71875, -7.08203125, -6.4453125, -5.80859375, -5.171875, -4.53515625, -3.8984375, -3.26171875, -2.625, -1.98828125, -1.3515625, -0.71484375, -0.078125, 0.55859375, 1.1953125, 1.83203125, 2.46875, 3.10546875, 3.7421875, 4.37890625, 5.015625, 5.65234375, 6.2890625, 6.92578125, 7.5625, 8.19921875, 8.8359375, 9.47265625, 10.109375, 10.74609375, 11.3828125, 12.01953125, 12.65625, 13.29296875, 13.9296875, 14.56640625, 15.203125, 15.83984375, 16.4765625, 17.11328125, 17.75, 18.38671875, 19.0234375, 19.66015625, 20.296875, 20.93359375, 21.5703125, 22.20703125, 22.84375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 6.0, 9.0, 15.0, 26.0, 27.0, 47.0, 67.0, 119.0, 191.0, 287.0, 382.0, 505.0, 599.0, 532.0, 411.0, 275.0, 209.0, 145.0, 93.0, 45.0, 34.0, 16.0, 19.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.356689453125, -8.82275390625, -8.288818359375, -7.7548828125, -7.220947265625, -6.68701171875, -6.153076171875, -5.619140625, -5.085205078125, -4.55126953125, -4.017333984375, -3.4833984375, -2.949462890625, -2.41552734375, -1.881591796875, -1.34765625, -0.813720703125, -0.27978515625, 0.254150390625, 0.7880859375, 1.322021484375, 1.85595703125, 2.389892578125, 2.923828125, 3.457763671875, 3.99169921875, 4.525634765625, 5.0595703125, 5.593505859375, 6.12744140625, 6.661376953125, 7.1953125, 7.729248046875, 8.26318359375, 8.797119140625, 9.3310546875, 9.864990234375, 10.39892578125, 10.932861328125, 11.466796875, 12.000732421875, 12.53466796875, 13.068603515625, 13.6025390625, 14.136474609375, 14.67041015625, 15.204345703125, 15.73828125, 16.272216796875, 16.80615234375, 17.340087890625, 17.8740234375, 18.407958984375, 18.94189453125, 19.475830078125, 20.009765625, 20.543701171875, 21.07763671875, 21.611572265625, 22.1455078125, 22.679443359375, 23.21337890625, 23.747314453125, 24.28125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 11.0, 25.0, 23.0, 42.0, 72.0, 127.0, 212.0, 285.0, 520.0, 1786.0, 320612.0, 3854938.0, 13749.0, 869.0, 373.0, 257.0, 148.0, 79.0, 51.0, 29.0, 29.0, 19.0, 13.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.9375, -79.1494140625, -77.361328125, -75.5732421875, -73.78515625, -71.9970703125, -70.208984375, -68.4208984375, -66.6328125, -64.8447265625, -63.056640625, -61.2685546875, -59.48046875, -57.6923828125, -55.904296875, -54.1162109375, -52.328125, -50.5400390625, -48.751953125, -46.9638671875, -45.17578125, -43.3876953125, -41.599609375, -39.8115234375, -38.0234375, -36.2353515625, -34.447265625, -32.6591796875, -30.87109375, -29.0830078125, -27.294921875, -25.5068359375, -23.71875, -21.9306640625, -20.142578125, -18.3544921875, -16.56640625, -14.7783203125, -12.990234375, -11.2021484375, -9.4140625, -7.6259765625, -5.837890625, -4.0498046875, -2.26171875, -0.4736328125, 1.314453125, 3.1025390625, 4.890625, 6.6787109375, 8.466796875, 10.2548828125, 12.04296875, 13.8310546875, 15.619140625, 17.4072265625, 19.1953125, 20.9833984375, 22.771484375, 24.5595703125, 26.34765625, 28.1357421875, 29.923828125, 31.7119140625, 33.5]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 56.0, 237.0, 398.0, 237.0, 64.0, 12.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.09307861328125, -123.33033752441406, -117.5676040649414, -111.80486297607422, -106.04212951660156, -100.27938842773438, -94.51664733886719, -88.75391387939453, -82.99118041992188, -77.22843933105469, -71.46570587158203, -65.70296478271484, -59.94023132324219, -54.177490234375, -48.41475296020508, -42.652015686035156, -36.88927459716797, -31.126537322998047, -25.363800048828125, -19.60106086730957, -13.838323593139648, -8.075586318969727, -2.312847137451172, 3.44989013671875, 9.212627410888672, 14.975364685058594, 20.738101959228516, 26.50084114074707, 32.263580322265625, 38.02631378173828, 43.78905487060547, 49.55179214477539, 55.31452941894531, 61.077266693115234, 66.84000396728516, 72.60274505615234, 78.365478515625, 84.12821960449219, 89.89096069335938, 95.65369415283203, 101.41642761230469, 107.17916870117188, 112.94190216064453, 118.70464324951172, 124.46737670898438, 130.23011779785156, 135.99285888671875, 141.75558471679688, 147.51834106445312, 153.2810821533203, 159.0438232421875, 164.80654907226562, 170.5692901611328, 176.33203125, 182.0947723388672, 187.85751342773438, 193.6202392578125, 199.3829803466797, 205.14572143554688, 210.908447265625, 216.6711883544922, 222.43392944335938, 228.19667053222656, 233.95941162109375, 239.72213745117188]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 1.0, 8.0, 8.0, 9.0, 9.0, 9.0, 19.0, 12.0, 31.0, 32.0, 28.0, 32.0, 33.0, 51.0, 33.0, 39.0, 50.0, 41.0, 31.0, 37.0, 45.0, 38.0, 47.0, 34.0, 48.0, 36.0, 29.0, 33.0, 19.0, 31.0, 13.0, 16.0, 20.0, 18.0, 16.0, 6.0, 12.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.532196044921875, -39.180660247802734, -37.82912063598633, -36.47758483886719, -35.12604904174805, -33.774513244628906, -32.4229736328125, -31.07143783569336, -29.719900131225586, -28.368362426757812, -27.016826629638672, -25.6652889251709, -24.313751220703125, -22.962215423583984, -21.61067771911621, -20.259140014648438, -18.907604217529297, -17.556066513061523, -16.204530715942383, -14.85299301147461, -13.501456260681152, -12.149919509887695, -10.798381805419922, -9.446845054626465, -8.095308303833008, -6.743771553039551, -5.3922343254089355, -4.04069709777832, -2.6891603469848633, -1.3376235961914062, 0.013914108276367188, 1.3654508590698242, 2.7169837951660156, 4.068520545959473, 5.420057773590088, 6.771595001220703, 8.12313175201416, 9.474668502807617, 10.82620620727539, 12.177742958068848, 13.529279708862305, 14.880816459655762, 16.23235321044922, 17.583890914916992, 18.935428619384766, 20.286964416503906, 21.63850212097168, 22.990039825439453, 24.341575622558594, 25.693113327026367, 27.044649124145508, 28.39618682861328, 29.747722625732422, 31.099260330200195, 32.45079803466797, 33.80233383178711, 35.15386962890625, 36.50540542602539, 37.8569450378418, 39.20848083496094, 40.56001663208008, 41.91155242919922, 43.263092041015625, 44.614627838134766, 45.96616744995117]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 16.0, 9.0, 14.0, 28.0, 20.0, 25.0, 30.0, 32.0, 24.0, 45.0, 39.0, 44.0, 49.0, 44.0, 39.0, 54.0, 58.0, 56.0, 50.0, 51.0, 32.0, 29.0, 30.0, 19.0, 33.0, 21.0, 28.0, 13.0, 12.0, 10.0, 8.0, 9.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.1854248046875, -4.980224609375, -4.7750244140625, -4.56982421875, -4.3646240234375, -4.159423828125, -3.9542236328125, -3.7490234375, -3.5438232421875, -3.338623046875, -3.1334228515625, -2.92822265625, -2.7230224609375, -2.517822265625, -2.3126220703125, -2.107421875, -1.9022216796875, -1.697021484375, -1.4918212890625, -1.28662109375, -1.0814208984375, -0.876220703125, -0.6710205078125, -0.4658203125, -0.2606201171875, -0.055419921875, 0.1497802734375, 0.35498046875, 0.5601806640625, 0.765380859375, 0.9705810546875, 1.17578125, 1.3809814453125, 1.586181640625, 1.7913818359375, 1.99658203125, 2.2017822265625, 2.406982421875, 2.6121826171875, 2.8173828125, 3.0225830078125, 3.227783203125, 3.4329833984375, 3.63818359375, 3.8433837890625, 4.048583984375, 4.2537841796875, 4.458984375, 4.6641845703125, 4.869384765625, 5.0745849609375, 5.27978515625, 5.4849853515625, 5.690185546875, 5.8953857421875, 6.1005859375, 6.3057861328125, 6.510986328125, 6.7161865234375, 6.92138671875, 7.1265869140625, 7.331787109375, 7.5369873046875, 7.7421875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 18.0, 10.0, 17.0, 30.0, 42.0, 57.0, 94.0, 105.0, 183.0, 267.0, 386.0, 584.0, 902.0, 1338.0, 2002.0, 2987.0, 4740.0, 7309.0, 11482.0, 17703.0, 28207.0, 44224.0, 69633.0, 107740.0, 163500.0, 191305.0, 140936.0, 90954.0, 58243.0, 37265.0, 23647.0, 15017.0, 9546.0, 6231.0, 3957.0, 2648.0, 1691.0, 1227.0, 759.0, 509.0, 331.0, 237.0, 159.0, 102.0, 68.0, 60.0, 38.0, 20.0, 17.0, 13.0, 8.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.43798828125, -0.4248390197753906, -0.41168975830078125, -0.3985404968261719, -0.3853912353515625, -0.3722419738769531, -0.35909271240234375, -0.3459434509277344, -0.332794189453125, -0.3196449279785156, -0.30649566650390625, -0.2933464050292969, -0.2801971435546875, -0.2670478820800781, -0.25389862060546875, -0.24074935913085938, -0.22760009765625, -0.21445083618164062, -0.20130157470703125, -0.18815231323242188, -0.1750030517578125, -0.16185379028320312, -0.14870452880859375, -0.13555526733398438, -0.122406005859375, -0.10925674438476562, -0.09610748291015625, -0.08295822143554688, -0.0698089599609375, -0.056659698486328125, -0.04351043701171875, -0.030361175537109375, -0.0172119140625, -0.004062652587890625, 0.00908660888671875, 0.022235870361328125, 0.0353851318359375, 0.048534393310546875, 0.06168365478515625, 0.07483291625976562, 0.087982177734375, 0.10113143920898438, 0.11428070068359375, 0.12742996215820312, 0.1405792236328125, 0.15372848510742188, 0.16687774658203125, 0.18002700805664062, 0.19317626953125, 0.20632553100585938, 0.21947479248046875, 0.23262405395507812, 0.2457733154296875, 0.2589225769042969, 0.27207183837890625, 0.2852210998535156, 0.298370361328125, 0.3115196228027344, 0.32466888427734375, 0.3378181457519531, 0.3509674072265625, 0.3641166687011719, 0.37726593017578125, 0.3904151916503906, 0.403564453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 8.0, 12.0, 10.0, 16.0, 20.0, 27.0, 19.0, 26.0, 29.0, 38.0, 34.0, 32.0, 40.0, 30.0, 42.0, 48.0, 47.0, 1068.0, 33.0, 36.0, 46.0, 39.0, 44.0, 40.0, 26.0, 31.0, 26.0, 19.0, 23.0, 17.0, 16.0, 10.0, 13.0, 8.0, 4.0, 4.0, 13.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.9140625, -3.798187255859375, -3.68231201171875, -3.566436767578125, -3.4505615234375, -3.334686279296875, -3.21881103515625, -3.102935791015625, -2.987060546875, -2.871185302734375, -2.75531005859375, -2.639434814453125, -2.5235595703125, -2.407684326171875, -2.29180908203125, -2.175933837890625, -2.06005859375, -1.944183349609375, -1.82830810546875, -1.712432861328125, -1.5965576171875, -1.480682373046875, -1.36480712890625, -1.248931884765625, -1.133056640625, -1.017181396484375, -0.90130615234375, -0.785430908203125, -0.6695556640625, -0.553680419921875, -0.43780517578125, -0.321929931640625, -0.2060546875, -0.090179443359375, 0.02569580078125, 0.141571044921875, 0.2574462890625, 0.373321533203125, 0.48919677734375, 0.605072021484375, 0.720947265625, 0.836822509765625, 0.95269775390625, 1.068572998046875, 1.1844482421875, 1.300323486328125, 1.41619873046875, 1.532073974609375, 1.64794921875, 1.763824462890625, 1.87969970703125, 1.995574951171875, 2.1114501953125, 2.227325439453125, 2.34320068359375, 2.459075927734375, 2.574951171875, 2.690826416015625, 2.80670166015625, 2.922576904296875, 3.0384521484375, 3.154327392578125, 3.27020263671875, 3.386077880859375, 3.501953125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 7.0, 8.0, 9.0, 23.0, 29.0, 59.0, 72.0, 114.0, 177.0, 253.0, 407.0, 647.0, 977.0, 1437.0, 2273.0, 3567.0, 5518.0, 8478.0, 12817.0, 19913.0, 30633.0, 46954.0, 71823.0, 108964.0, 151333.0, 1216983.0, 138771.0, 96053.0, 62833.0, 40628.0, 26457.0, 17178.0, 11107.0, 7210.0, 4696.0, 3120.0, 1983.0, 1235.0, 878.0, 546.0, 331.0, 224.0, 148.0, 82.0, 63.0, 52.0, 20.0, 14.0, 7.0, 8.0, 9.0, 2.0, 5.0, 1.0, 2.0], "bins": [-0.37451171875, -0.3636054992675781, -0.35269927978515625, -0.3417930603027344, -0.3308868408203125, -0.3199806213378906, -0.30907440185546875, -0.2981681823730469, -0.287261962890625, -0.2763557434082031, -0.26544952392578125, -0.2545433044433594, -0.2436370849609375, -0.23273086547851562, -0.22182464599609375, -0.21091842651367188, -0.20001220703125, -0.18910598754882812, -0.17819976806640625, -0.16729354858398438, -0.1563873291015625, -0.14548110961914062, -0.13457489013671875, -0.12366867065429688, -0.112762451171875, -0.10185623168945312, -0.09095001220703125, -0.08004379272460938, -0.0691375732421875, -0.058231353759765625, -0.04732513427734375, -0.036418914794921875, -0.0255126953125, -0.014606475830078125, -0.00370025634765625, 0.007205963134765625, 0.0181121826171875, 0.029018402099609375, 0.03992462158203125, 0.050830841064453125, 0.061737060546875, 0.07264328002929688, 0.08354949951171875, 0.09445571899414062, 0.1053619384765625, 0.11626815795898438, 0.12717437744140625, 0.13808059692382812, 0.14898681640625, 0.15989303588867188, 0.17079925537109375, 0.18170547485351562, 0.1926116943359375, 0.20351791381835938, 0.21442413330078125, 0.22533035278320312, 0.236236572265625, 0.24714279174804688, 0.25804901123046875, 0.2689552307128906, 0.2798614501953125, 0.2907676696777344, 0.30167388916015625, 0.3125801086425781, 0.323486328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 10.0, 10.0, 20.0, 15.0, 26.0, 28.0, 32.0, 44.0, 46.0, 52.0, 58.0, 68.0, 60.0, 59.0, 61.0, 61.0, 59.0, 48.0, 53.0, 46.0, 30.0, 25.0, 16.0, 20.0, 13.0, 9.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013570785522460938, -0.0013088881969451904, -0.0012606978416442871, -0.0012125074863433838, -0.0011643171310424805, -0.0011161267757415771, -0.0010679364204406738, -0.0010197460651397705, -0.0009715557098388672, -0.0009233653545379639, -0.0008751749992370605, -0.0008269846439361572, -0.0007787942886352539, -0.0007306039333343506, -0.0006824135780334473, -0.0006342232227325439, -0.0005860328674316406, -0.0005378425121307373, -0.000489652156829834, -0.00044146180152893066, -0.00039327144622802734, -0.000345081090927124, -0.0002968907356262207, -0.0002487003803253174, -0.00020051002502441406, -0.00015231966972351074, -0.00010412931442260742, -5.59389591217041e-05, -7.748603820800781e-06, 4.044175148010254e-05, 8.863210678100586e-05, 0.00013682246208190918, 0.0001850128173828125, 0.00023320317268371582, 0.00028139352798461914, 0.00032958388328552246, 0.0003777742385864258, 0.0004259645938873291, 0.0004741549491882324, 0.0005223453044891357, 0.0005705356597900391, 0.0006187260150909424, 0.0006669163703918457, 0.000715106725692749, 0.0007632970809936523, 0.0008114874362945557, 0.000859677791595459, 0.0009078681468963623, 0.0009560585021972656, 0.001004248857498169, 0.0010524392127990723, 0.0011006295680999756, 0.001148819923400879, 0.0011970102787017822, 0.0012452006340026855, 0.0012933909893035889, 0.0013415813446044922, 0.0013897716999053955, 0.0014379620552062988, 0.0014861524105072021, 0.0015343427658081055, 0.0015825331211090088, 0.0016307234764099121, 0.0016789138317108154, 0.0017271041870117188]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 16.0, 20.0, 17.0, 31.0, 32.0, 56.0, 85.0, 109.0, 171.0, 373.0, 1184.0, 462298.0, 581960.0, 1230.0, 416.0, 169.0, 102.0, 66.0, 63.0, 44.0, 27.0, 17.0, 18.0, 11.0, 6.0, 10.0, 4.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03790283203125, -0.036820411682128906, -0.03573799133300781, -0.03465557098388672, -0.033573150634765625, -0.03249073028564453, -0.03140830993652344, -0.030325889587402344, -0.02924346923828125, -0.028161048889160156, -0.027078628540039062, -0.02599620819091797, -0.024913787841796875, -0.02383136749267578, -0.022748947143554688, -0.021666526794433594, -0.0205841064453125, -0.019501686096191406, -0.018419265747070312, -0.01733684539794922, -0.016254425048828125, -0.015172004699707031, -0.014089584350585938, -0.013007164001464844, -0.01192474365234375, -0.010842323303222656, -0.009759902954101562, -0.008677482604980469, -0.007595062255859375, -0.006512641906738281, -0.0054302215576171875, -0.004347801208496094, -0.003265380859375, -0.0021829605102539062, -0.0011005401611328125, -1.811981201171875e-05, 0.001064300537109375, 0.0021467208862304688, 0.0032291412353515625, 0.004311561584472656, 0.00539398193359375, 0.006476402282714844, 0.0075588226318359375, 0.008641242980957031, 0.009723663330078125, 0.010806083679199219, 0.011888504028320312, 0.012970924377441406, 0.0140533447265625, 0.015135765075683594, 0.016218185424804688, 0.01730060577392578, 0.018383026123046875, 0.01946544647216797, 0.020547866821289062, 0.021630287170410156, 0.02271270751953125, 0.023795127868652344, 0.024877548217773438, 0.02595996856689453, 0.027042388916015625, 0.02812480926513672, 0.029207229614257812, 0.030289649963378906, 0.0313720703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 12.0, 83.0, 316.0, 414.0, 163.0, 24.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012022546725347638, -0.0010945876128971577, -0.0009869205532595515, -0.0008792535518296063, -0.0007715865503996611, -0.0006639194907620549, -0.0005562524311244488, -0.00044858542969450355, -0.0003409183700568974, -0.00023325133952312171, -0.0001255842944374308, -1.7917249351739883e-05, 8.97497811820358e-05, 0.0001974168117158115, 0.00030508387135341763, 0.00041275087278336287, 0.000520417932420969, 0.0006280849920585752, 0.0007357519934885204, 0.0008434190531261265, 0.0009510860545560718, 0.001058753114193678, 0.001166420173831284, 0.0012740872334688902, 0.0013817541766911745, 0.0014894212363287807, 0.0015970882959663868, 0.0017047552391886711, 0.0018124222988262773, 0.0019200893584638834, 0.0020277565345168114, 0.0021354234777390957, 0.0022430906537920237, 0.002350757597014308, 0.002458424773067236, 0.0025660917162895203, 0.0026737588923424482, 0.0027814258355647326, 0.0028890930116176605, 0.002996759954839945, 0.003104426898062229, 0.0032120938412845135, 0.0033197610173374414, 0.0034274279605597258, 0.0035350951366126537, 0.003642762079834938, 0.0037504290230572224, 0.0038580961991101503, 0.003965763375163078, 0.004073430318385363, 0.004181097261607647, 0.004288764670491219, 0.004396431613713503, 0.004504098556935787, 0.0046117655001580715, 0.004719432443380356, 0.00482709938660264, 0.0049347663298249245, 0.005042433273047209, 0.00515010068193078, 0.005257767625153065, 0.005365434568375349, 0.005473101511597633, 0.005580768454819918, 0.005688435863703489]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 8.0, 3.0, 15.0, 7.0, 10.0, 13.0, 15.0, 18.0, 24.0, 26.0, 33.0, 21.0, 38.0, 22.0, 35.0, 37.0, 36.0, 35.0, 42.0, 45.0, 44.0, 45.0, 32.0, 50.0, 38.0, 25.0, 40.0, 25.0, 40.0, 21.0, 24.0, 25.0, 8.0, 15.0, 13.0, 20.0, 19.0, 7.0, 8.0, 4.0, 0.0, 2.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000577092170715332, -0.0005559744313359261, -0.0005348566919565201, -0.0005137389525771141, -0.0004926212131977081, -0.00047150347381830215, -0.0004503857344388962, -0.0004292679950594902, -0.00040815025568008423, -0.00038703251630067825, -0.0003659147769212723, -0.0003447970375418663, -0.00032367929816246033, -0.00030256155878305435, -0.0002814438194036484, -0.0002603260800242424, -0.00023920834064483643, -0.00021809060126543045, -0.00019697286188602448, -0.0001758551225066185, -0.00015473738312721252, -0.00013361964374780655, -0.00011250190436840057, -9.13841649889946e-05, -7.026642560958862e-05, -4.914868623018265e-05, -2.8030946850776672e-05, -6.913207471370697e-06, 1.4204531908035278e-05, 3.5322271287441254e-05, 5.644001066684723e-05, 7.75577500462532e-05, 9.867548942565918e-05, 0.00011979322880506516, 0.00014091096818447113, 0.0001620287075638771, 0.00018314644694328308, 0.00020426418632268906, 0.00022538192570209503, 0.000246499665081501, 0.000267617404460907, 0.00028873514384031296, 0.00030985288321971893, 0.0003309706225991249, 0.0003520883619785309, 0.00037320610135793686, 0.00039432384073734283, 0.0004154415801167488, 0.0004365593194961548, 0.00045767705887556076, 0.00047879479825496674, 0.0004999125376343727, 0.0005210302770137787, 0.0005421480163931847, 0.0005632657557725906, 0.0005843834951519966, 0.0006055012345314026, 0.0006266189739108086, 0.0006477367132902145, 0.0006688544526696205, 0.0006899721920490265, 0.0007110899314284325, 0.0007322076708078384, 0.0007533254101872444, 0.0007744431495666504]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 16.0, 9.0, 14.0, 28.0, 20.0, 25.0, 30.0, 32.0, 24.0, 45.0, 39.0, 44.0, 49.0, 44.0, 39.0, 54.0, 58.0, 56.0, 50.0, 51.0, 32.0, 29.0, 30.0, 19.0, 33.0, 21.0, 28.0, 13.0, 12.0, 10.0, 8.0, 9.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.1854248046875, -4.980224609375, -4.7750244140625, -4.56982421875, -4.3646240234375, -4.159423828125, -3.9542236328125, -3.7490234375, -3.5438232421875, -3.338623046875, -3.1334228515625, -2.92822265625, -2.7230224609375, -2.517822265625, -2.3126220703125, -2.107421875, -1.9022216796875, -1.697021484375, -1.4918212890625, -1.28662109375, -1.0814208984375, -0.876220703125, -0.6710205078125, -0.4658203125, -0.2606201171875, -0.055419921875, 0.1497802734375, 0.35498046875, 0.5601806640625, 0.765380859375, 0.9705810546875, 1.17578125, 1.3809814453125, 1.586181640625, 1.7913818359375, 1.99658203125, 2.2017822265625, 2.406982421875, 2.6121826171875, 2.8173828125, 3.0225830078125, 3.227783203125, 3.4329833984375, 3.63818359375, 3.8433837890625, 4.048583984375, 4.2537841796875, 4.458984375, 4.6641845703125, 4.869384765625, 5.0745849609375, 5.27978515625, 5.4849853515625, 5.690185546875, 5.8953857421875, 6.1005859375, 6.3057861328125, 6.510986328125, 6.7161865234375, 6.92138671875, 7.1265869140625, 7.331787109375, 7.5369873046875, 7.7421875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 13.0, 17.0, 15.0, 25.0, 48.0, 66.0, 116.0, 169.0, 225.0, 399.0, 689.0, 1142.0, 2262.0, 4514.0, 9722.0, 21865.0, 52206.0, 129725.0, 300145.0, 300907.0, 129755.0, 53081.0, 22018.0, 9714.0, 4535.0, 2275.0, 1189.0, 609.0, 398.0, 234.0, 135.0, 107.0, 82.0, 31.0, 33.0, 22.0, 9.0, 16.0, 8.0, 6.0, 3.0, 4.0, 10.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-5.14453125, -4.9608154296875, -4.777099609375, -4.5933837890625, -4.40966796875, -4.2259521484375, -4.042236328125, -3.8585205078125, -3.6748046875, -3.4910888671875, -3.307373046875, -3.1236572265625, -2.93994140625, -2.7562255859375, -2.572509765625, -2.3887939453125, -2.205078125, -2.0213623046875, -1.837646484375, -1.6539306640625, -1.47021484375, -1.2864990234375, -1.102783203125, -0.9190673828125, -0.7353515625, -0.5516357421875, -0.367919921875, -0.1842041015625, -0.00048828125, 0.1832275390625, 0.366943359375, 0.5506591796875, 0.734375, 0.9180908203125, 1.101806640625, 1.2855224609375, 1.46923828125, 1.6529541015625, 1.836669921875, 2.0203857421875, 2.2041015625, 2.3878173828125, 2.571533203125, 2.7552490234375, 2.93896484375, 3.1226806640625, 3.306396484375, 3.4901123046875, 3.673828125, 3.8575439453125, 4.041259765625, 4.2249755859375, 4.40869140625, 4.5924072265625, 4.776123046875, 4.9598388671875, 5.1435546875, 5.3272705078125, 5.510986328125, 5.6947021484375, 5.87841796875, 6.0621337890625, 6.245849609375, 6.4295654296875, 6.61328125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 6.0, 8.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 7.0, 11.0, 13.0, 18.0, 25.0, 26.0, 28.0, 21.0, 33.0, 25.0, 40.0, 43.0, 50.0, 83.0, 131.0, 227.0, 1429.0, 234.0, 133.0, 70.0, 41.0, 39.0, 37.0, 38.0, 39.0, 21.0, 23.0, 18.0, 16.0, 14.0, 17.0, 8.0, 15.0, 5.0, 9.0, 6.0, 1.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.328125, -16.759765625, -16.19140625, -15.623046875, -15.0546875, -14.486328125, -13.91796875, -13.349609375, -12.78125, -12.212890625, -11.64453125, -11.076171875, -10.5078125, -9.939453125, -9.37109375, -8.802734375, -8.234375, -7.666015625, -7.09765625, -6.529296875, -5.9609375, -5.392578125, -4.82421875, -4.255859375, -3.6875, -3.119140625, -2.55078125, -1.982421875, -1.4140625, -0.845703125, -0.27734375, 0.291015625, 0.859375, 1.427734375, 1.99609375, 2.564453125, 3.1328125, 3.701171875, 4.26953125, 4.837890625, 5.40625, 5.974609375, 6.54296875, 7.111328125, 7.6796875, 8.248046875, 8.81640625, 9.384765625, 9.953125, 10.521484375, 11.08984375, 11.658203125, 12.2265625, 12.794921875, 13.36328125, 13.931640625, 14.5, 15.068359375, 15.63671875, 16.205078125, 16.7734375, 17.341796875, 17.91015625, 18.478515625, 19.046875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 6.0, 9.0, 11.0, 18.0, 25.0, 20.0, 32.0, 43.0, 79.0, 119.0, 202.0, 400.0, 913.0, 18236.0, 3118910.0, 5061.0, 668.0, 340.0, 209.0, 128.0, 79.0, 48.0, 43.0, 35.0, 14.0, 13.0, 8.0, 8.0, 4.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.1875, -94.275390625, -91.36328125, -88.451171875, -85.5390625, -82.626953125, -79.71484375, -76.802734375, -73.890625, -70.978515625, -68.06640625, -65.154296875, -62.2421875, -59.330078125, -56.41796875, -53.505859375, -50.59375, -47.681640625, -44.76953125, -41.857421875, -38.9453125, -36.033203125, -33.12109375, -30.208984375, -27.296875, -24.384765625, -21.47265625, -18.560546875, -15.6484375, -12.736328125, -9.82421875, -6.912109375, -4.0, -1.087890625, 1.82421875, 4.736328125, 7.6484375, 10.560546875, 13.47265625, 16.384765625, 19.296875, 22.208984375, 25.12109375, 28.033203125, 30.9453125, 33.857421875, 36.76953125, 39.681640625, 42.59375, 45.505859375, 48.41796875, 51.330078125, 54.2421875, 57.154296875, 60.06640625, 62.978515625, 65.890625, 68.802734375, 71.71484375, 74.626953125, 77.5390625, 80.451171875, 83.36328125, 86.275390625, 89.1875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 41.0, 75.0, 154.0, 236.0, 228.0, 157.0, 79.0, 23.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.55328369140625, -45.788604736328125, -44.023921966552734, -42.25924301147461, -40.494564056396484, -38.729881286621094, -36.96520233154297, -35.200523376464844, -33.43584442138672, -31.67116355895996, -29.906484603881836, -28.141803741455078, -26.377124786376953, -24.612443923950195, -22.847763061523438, -21.083084106445312, -19.318401336669922, -17.553720474243164, -15.789041519165039, -14.024360656738281, -12.25968074798584, -10.495000839233398, -8.73031997680664, -6.965640068054199, -5.200960159301758, -3.4362800121307373, -1.6715998649597168, 0.09308052062988281, 1.8577604293823242, 3.6224403381347656, 5.387121200561523, 7.151801109313965, 8.916481018066406, 10.681160926818848, 12.445840835571289, 14.210521697998047, 15.975201606750488, 17.73988151550293, 19.504562377929688, 21.269241333007812, 23.03392219543457, 24.798603057861328, 26.563282012939453, 28.32796287536621, 30.09264373779297, 31.857322692871094, 33.62200164794922, 35.38668441772461, 37.151363372802734, 38.91604232788086, 40.68072509765625, 42.445404052734375, 44.2100830078125, 45.974761962890625, 47.739444732666016, 49.50412368774414, 51.26880645751953, 53.033485412597656, 54.79816818237305, 56.56284713745117, 58.3275260925293, 60.09220886230469, 61.85688781738281, 63.62156677246094, 65.38624572753906]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 5.0, 10.0, 8.0, 9.0, 17.0, 20.0, 14.0, 13.0, 18.0, 20.0, 16.0, 30.0, 27.0, 33.0, 27.0, 35.0, 38.0, 28.0, 37.0, 38.0, 34.0, 48.0, 37.0, 42.0, 43.0, 35.0, 29.0, 25.0, 34.0, 29.0, 25.0, 22.0, 22.0, 17.0, 19.0, 13.0, 8.0, 17.0, 13.0, 8.0, 4.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-45.83510971069336, -44.48036575317383, -43.12561798095703, -41.7708740234375, -40.41613006591797, -39.06138229370117, -37.70663833618164, -36.351890563964844, -34.99714660644531, -33.64240264892578, -32.287654876708984, -30.932910919189453, -29.57816505432129, -28.223419189453125, -26.868675231933594, -25.51392936706543, -24.159183502197266, -22.8044376373291, -21.449691772460938, -20.094947814941406, -18.740201950073242, -17.385456085205078, -16.030712127685547, -14.675966262817383, -13.321220397949219, -11.966474533081055, -10.611729621887207, -9.25698471069336, -7.902238845825195, -6.5474934577941895, -5.192748069763184, -3.838003158569336, -2.4832534790039062, -1.1285080909729004, 0.22623729705810547, 1.5809826850891113, 2.935728073120117, 4.290473461151123, 5.645218849182129, 6.999963760375977, 8.35470962524414, 9.709455490112305, 11.064200401306152, 12.4189453125, 13.773691177368164, 15.128437042236328, 16.48318099975586, 17.837926864624023, 19.192672729492188, 20.54741859436035, 21.902164459228516, 23.256908416748047, 24.61165428161621, 25.966400146484375, 27.321144104003906, 28.67588996887207, 30.030635833740234, 31.3853816986084, 32.74012756347656, 34.094871520996094, 35.449615478515625, 36.80436325073242, 38.15910720825195, 39.51385498046875, 40.86859893798828]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 10.0, 9.0, 9.0, 20.0, 16.0, 17.0, 31.0, 25.0, 18.0, 33.0, 31.0, 33.0, 43.0, 39.0, 49.0, 40.0, 45.0, 51.0, 55.0, 61.0, 46.0, 42.0, 34.0, 33.0, 33.0, 31.0, 20.0, 21.0, 23.0, 15.0, 18.0, 19.0, 8.0, 2.0, 6.0, 7.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.52716064453125, -5.3082275390625, -5.08929443359375, -4.870361328125, -4.65142822265625, -4.4324951171875, -4.21356201171875, -3.99462890625, -3.77569580078125, -3.5567626953125, -3.33782958984375, -3.118896484375, -2.89996337890625, -2.6810302734375, -2.46209716796875, -2.2431640625, -2.02423095703125, -1.8052978515625, -1.58636474609375, -1.367431640625, -1.14849853515625, -0.9295654296875, -0.71063232421875, -0.49169921875, -0.27276611328125, -0.0538330078125, 0.16510009765625, 0.384033203125, 0.60296630859375, 0.8218994140625, 1.04083251953125, 1.259765625, 1.47869873046875, 1.6976318359375, 1.91656494140625, 2.135498046875, 2.35443115234375, 2.5733642578125, 2.79229736328125, 3.01123046875, 3.23016357421875, 3.4490966796875, 3.66802978515625, 3.886962890625, 4.10589599609375, 4.3248291015625, 4.54376220703125, 4.7626953125, 4.98162841796875, 5.2005615234375, 5.41949462890625, 5.638427734375, 5.85736083984375, 6.0762939453125, 6.29522705078125, 6.51416015625, 6.73309326171875, 6.9520263671875, 7.17095947265625, 7.389892578125, 7.60882568359375, 7.8277587890625, 8.04669189453125, 8.265625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 4.0, 4.0, 3.0, 7.0, 4.0, 8.0, 6.0, 11.0, 19.0, 21.0, 39.0, 38.0, 47.0, 53.0, 91.0, 146.0, 210.0, 415.0, 1053.0, 4270.0, 31103.0, 330693.0, 1988301.0, 1600767.0, 212096.0, 20046.0, 3004.0, 845.0, 364.0, 209.0, 103.0, 82.0, 45.0, 45.0, 34.0, 21.0, 23.0, 15.0, 8.0, 15.0, 7.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.078125, -10.6663818359375, -10.254638671875, -9.8428955078125, -9.43115234375, -9.0194091796875, -8.607666015625, -8.1959228515625, -7.7841796875, -7.3724365234375, -6.960693359375, -6.5489501953125, -6.13720703125, -5.7254638671875, -5.313720703125, -4.9019775390625, -4.490234375, -4.0784912109375, -3.666748046875, -3.2550048828125, -2.84326171875, -2.4315185546875, -2.019775390625, -1.6080322265625, -1.1962890625, -0.7845458984375, -0.372802734375, 0.0389404296875, 0.45068359375, 0.8624267578125, 1.274169921875, 1.6859130859375, 2.09765625, 2.5093994140625, 2.921142578125, 3.3328857421875, 3.74462890625, 4.1563720703125, 4.568115234375, 4.9798583984375, 5.3916015625, 5.8033447265625, 6.215087890625, 6.6268310546875, 7.03857421875, 7.4503173828125, 7.862060546875, 8.2738037109375, 8.685546875, 9.0972900390625, 9.509033203125, 9.9207763671875, 10.33251953125, 10.7442626953125, 11.156005859375, 11.5677490234375, 11.9794921875, 12.3912353515625, 12.802978515625, 13.2147216796875, 13.62646484375, 14.0382080078125, 14.449951171875, 14.8616943359375, 15.2734375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 4.0, 3.0, 9.0, 6.0, 14.0, 15.0, 14.0, 27.0, 41.0, 46.0, 75.0, 120.0, 152.0, 182.0, 253.0, 317.0, 409.0, 433.0, 422.0, 392.0, 309.0, 230.0, 174.0, 127.0, 85.0, 56.0, 37.0, 42.0, 27.0, 12.0, 10.0, 5.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.09375, -12.693603515625, -12.29345703125, -11.893310546875, -11.4931640625, -11.093017578125, -10.69287109375, -10.292724609375, -9.892578125, -9.492431640625, -9.09228515625, -8.692138671875, -8.2919921875, -7.891845703125, -7.49169921875, -7.091552734375, -6.69140625, -6.291259765625, -5.89111328125, -5.490966796875, -5.0908203125, -4.690673828125, -4.29052734375, -3.890380859375, -3.490234375, -3.090087890625, -2.68994140625, -2.289794921875, -1.8896484375, -1.489501953125, -1.08935546875, -0.689208984375, -0.2890625, 0.111083984375, 0.51123046875, 0.911376953125, 1.3115234375, 1.711669921875, 2.11181640625, 2.511962890625, 2.912109375, 3.312255859375, 3.71240234375, 4.112548828125, 4.5126953125, 4.912841796875, 5.31298828125, 5.713134765625, 6.11328125, 6.513427734375, 6.91357421875, 7.313720703125, 7.7138671875, 8.114013671875, 8.51416015625, 8.914306640625, 9.314453125, 9.714599609375, 10.11474609375, 10.514892578125, 10.9150390625, 11.315185546875, 11.71533203125, 12.115478515625, 12.515625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 12.0, 8.0, 15.0, 24.0, 40.0, 55.0, 64.0, 101.0, 154.0, 226.0, 337.0, 526.0, 1643.0, 93952.0, 3881716.0, 211358.0, 2319.0, 581.0, 349.0, 231.0, 170.0, 115.0, 81.0, 59.0, 32.0, 29.0, 17.0, 20.0, 7.0, 2.0, 10.0, 3.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.84375, -41.48681640625, -40.1298828125, -38.77294921875, -37.416015625, -36.05908203125, -34.7021484375, -33.34521484375, -31.98828125, -30.63134765625, -29.2744140625, -27.91748046875, -26.560546875, -25.20361328125, -23.8466796875, -22.48974609375, -21.1328125, -19.77587890625, -18.4189453125, -17.06201171875, -15.705078125, -14.34814453125, -12.9912109375, -11.63427734375, -10.27734375, -8.92041015625, -7.5634765625, -6.20654296875, -4.849609375, -3.49267578125, -2.1357421875, -0.77880859375, 0.578125, 1.93505859375, 3.2919921875, 4.64892578125, 6.005859375, 7.36279296875, 8.7197265625, 10.07666015625, 11.43359375, 12.79052734375, 14.1474609375, 15.50439453125, 16.861328125, 18.21826171875, 19.5751953125, 20.93212890625, 22.2890625, 23.64599609375, 25.0029296875, 26.35986328125, 27.716796875, 29.07373046875, 30.4306640625, 31.78759765625, 33.14453125, 34.50146484375, 35.8583984375, 37.21533203125, 38.572265625, 39.92919921875, 41.2861328125, 42.64306640625, 44.0]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 23.0, 25.0, 39.0, 55.0, 72.0, 95.0, 95.0, 112.0, 114.0, 108.0, 92.0, 63.0, 47.0, 22.0, 15.0, 10.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.18644714355469, -63.49686050415039, -61.807273864746094, -60.1176872253418, -58.4281005859375, -56.7385139465332, -55.048927307128906, -53.359336853027344, -51.66975402832031, -49.980167388916016, -48.29058074951172, -46.60099411010742, -44.911407470703125, -43.22182083129883, -41.53223419189453, -39.84264373779297, -38.15305709838867, -36.463470458984375, -34.77388381958008, -33.08429718017578, -31.394710540771484, -29.705123901367188, -28.015535354614258, -26.32594871520996, -24.636362075805664, -22.946775436401367, -21.25718879699707, -19.56760025024414, -17.878013610839844, -16.188426971435547, -14.49884033203125, -12.809253692626953, -11.119670867919922, -9.430084228515625, -7.74049711227417, -6.050909996032715, -4.361323356628418, -2.671736717224121, -0.9821491241455078, 0.7074375152587891, 2.397024154663086, 4.086610794067383, 5.776197910308838, 7.465785026550293, 9.15537166595459, 10.844958305358887, 12.5345458984375, 14.224132537841797, 15.913719177246094, 17.60330581665039, 19.292892456054688, 20.982479095458984, 22.67206573486328, 24.361652374267578, 26.051240921020508, 27.740827560424805, 29.4304141998291, 31.1200008392334, 32.80958938598633, 34.499176025390625, 36.18876266479492, 37.87834930419922, 39.567935943603516, 41.25752258300781, 42.94710922241211]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 7.0, 6.0, 6.0, 18.0, 14.0, 25.0, 17.0, 14.0, 18.0, 23.0, 20.0, 26.0, 21.0, 29.0, 39.0, 30.0, 39.0, 34.0, 28.0, 43.0, 34.0, 39.0, 43.0, 48.0, 33.0, 38.0, 33.0, 28.0, 35.0, 24.0, 24.0, 25.0, 23.0, 21.0, 17.0, 18.0, 14.0, 4.0, 9.0, 9.0, 6.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-39.19010925292969, -38.00028610229492, -36.810462951660156, -35.620635986328125, -34.43081283569336, -33.240989685058594, -32.05116271972656, -30.861339569091797, -29.67151641845703, -28.481693267822266, -27.291868209838867, -26.10204315185547, -24.912220001220703, -23.722396850585938, -22.53257179260254, -21.34274673461914, -20.152923583984375, -18.96310043334961, -17.77327537536621, -16.583450317382812, -15.393627166748047, -14.203803062438965, -13.013978958129883, -11.8241548538208, -10.634330749511719, -9.444506645202637, -8.254682540893555, -7.064858436584473, -5.875034332275391, -4.685210227966309, -3.4953861236572266, -2.3055620193481445, -1.1157341003417969, 0.07409000396728516, 1.2639141082763672, 2.453738212585449, 3.6435623168945312, 4.833386421203613, 6.023210525512695, 7.213034629821777, 8.40285873413086, 9.592682838439941, 10.782506942749023, 11.972331047058105, 13.162155151367188, 14.35197925567627, 15.541803359985352, 16.73162841796875, 17.921451568603516, 19.11127471923828, 20.30109977722168, 21.490924835205078, 22.680747985839844, 23.87057113647461, 25.060396194458008, 26.250221252441406, 27.440044403076172, 28.629867553710938, 29.819692611694336, 31.009517669677734, 32.1993408203125, 33.389163970947266, 34.57898712158203, 35.76881408691406, 36.95863723754883]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 8.0, 10.0, 9.0, 9.0, 13.0, 18.0, 24.0, 19.0, 35.0, 25.0, 33.0, 37.0, 42.0, 38.0, 42.0, 48.0, 42.0, 47.0, 48.0, 60.0, 51.0, 56.0, 34.0, 49.0, 25.0, 28.0, 29.0, 23.0, 21.0, 15.0, 12.0, 9.0, 7.0, 10.0, 12.0, 8.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7679443359375, -5.551513671875, -5.3350830078125, -5.11865234375, -4.9022216796875, -4.685791015625, -4.4693603515625, -4.2529296875, -4.0364990234375, -3.820068359375, -3.6036376953125, -3.38720703125, -3.1707763671875, -2.954345703125, -2.7379150390625, -2.521484375, -2.3050537109375, -2.088623046875, -1.8721923828125, -1.65576171875, -1.4393310546875, -1.222900390625, -1.0064697265625, -0.7900390625, -0.5736083984375, -0.357177734375, -0.1407470703125, 0.07568359375, 0.2921142578125, 0.508544921875, 0.7249755859375, 0.94140625, 1.1578369140625, 1.374267578125, 1.5906982421875, 1.80712890625, 2.0235595703125, 2.239990234375, 2.4564208984375, 2.6728515625, 2.8892822265625, 3.105712890625, 3.3221435546875, 3.53857421875, 3.7550048828125, 3.971435546875, 4.1878662109375, 4.404296875, 4.6207275390625, 4.837158203125, 5.0535888671875, 5.27001953125, 5.4864501953125, 5.702880859375, 5.9193115234375, 6.1357421875, 6.3521728515625, 6.568603515625, 6.7850341796875, 7.00146484375, 7.2178955078125, 7.434326171875, 7.6507568359375, 7.8671875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 6.0, 12.0, 27.0, 33.0, 62.0, 80.0, 141.0, 233.0, 381.0, 671.0, 1134.0, 1977.0, 3454.0, 5992.0, 11054.0, 20442.0, 38108.0, 73151.0, 139500.0, 243169.0, 233142.0, 130202.0, 67498.0, 35176.0, 19024.0, 10433.0, 5643.0, 3243.0, 1854.0, 1126.0, 630.0, 363.0, 212.0, 141.0, 77.0, 47.0, 44.0, 20.0, 16.0, 10.0, 11.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5830078125, -0.56353759765625, -0.5440673828125, -0.52459716796875, -0.505126953125, -0.48565673828125, -0.4661865234375, -0.44671630859375, -0.42724609375, -0.40777587890625, -0.3883056640625, -0.36883544921875, -0.349365234375, -0.32989501953125, -0.3104248046875, -0.29095458984375, -0.271484375, -0.25201416015625, -0.2325439453125, -0.21307373046875, -0.193603515625, -0.17413330078125, -0.1546630859375, -0.13519287109375, -0.11572265625, -0.09625244140625, -0.0767822265625, -0.05731201171875, -0.037841796875, -0.01837158203125, 0.0010986328125, 0.02056884765625, 0.0400390625, 0.05950927734375, 0.0789794921875, 0.09844970703125, 0.117919921875, 0.13739013671875, 0.1568603515625, 0.17633056640625, 0.19580078125, 0.21527099609375, 0.2347412109375, 0.25421142578125, 0.273681640625, 0.29315185546875, 0.3126220703125, 0.33209228515625, 0.3515625, 0.37103271484375, 0.3905029296875, 0.40997314453125, 0.429443359375, 0.44891357421875, 0.4683837890625, 0.48785400390625, 0.50732421875, 0.52679443359375, 0.5462646484375, 0.56573486328125, 0.585205078125, 0.60467529296875, 0.6241455078125, 0.64361572265625, 0.6630859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 14.0, 21.0, 15.0, 28.0, 21.0, 19.0, 26.0, 23.0, 25.0, 43.0, 34.0, 48.0, 43.0, 37.0, 51.0, 1068.0, 35.0, 47.0, 38.0, 39.0, 40.0, 42.0, 43.0, 34.0, 19.0, 16.0, 22.0, 24.0, 15.0, 16.0, 15.0, 8.0, 7.0, 11.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.65509033203125, -3.5289306640625, -3.40277099609375, -3.276611328125, -3.15045166015625, -3.0242919921875, -2.89813232421875, -2.77197265625, -2.64581298828125, -2.5196533203125, -2.39349365234375, -2.267333984375, -2.14117431640625, -2.0150146484375, -1.88885498046875, -1.7626953125, -1.63653564453125, -1.5103759765625, -1.38421630859375, -1.258056640625, -1.13189697265625, -1.0057373046875, -0.87957763671875, -0.75341796875, -0.62725830078125, -0.5010986328125, -0.37493896484375, -0.248779296875, -0.12261962890625, 0.0035400390625, 0.12969970703125, 0.255859375, 0.38201904296875, 0.5081787109375, 0.63433837890625, 0.760498046875, 0.88665771484375, 1.0128173828125, 1.13897705078125, 1.26513671875, 1.39129638671875, 1.5174560546875, 1.64361572265625, 1.769775390625, 1.89593505859375, 2.0220947265625, 2.14825439453125, 2.2744140625, 2.40057373046875, 2.5267333984375, 2.65289306640625, 2.779052734375, 2.90521240234375, 3.0313720703125, 3.15753173828125, 3.28369140625, 3.40985107421875, 3.5360107421875, 3.66217041015625, 3.788330078125, 3.91448974609375, 4.0406494140625, 4.16680908203125, 4.29296875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 6.0, 13.0, 22.0, 40.0, 40.0, 70.0, 99.0, 144.0, 227.0, 358.0, 558.0, 781.0, 1124.0, 1766.0, 2714.0, 3942.0, 6076.0, 9029.0, 13464.0, 19794.0, 29967.0, 44785.0, 67038.0, 99963.0, 142231.0, 1215350.0, 140109.0, 98096.0, 66345.0, 44072.0, 29437.0, 19582.0, 13293.0, 9079.0, 6027.0, 3840.0, 2614.0, 1682.0, 1129.0, 743.0, 496.0, 341.0, 231.0, 148.0, 87.0, 58.0, 43.0, 27.0, 27.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.359130859375, -0.3484039306640625, -0.337677001953125, -0.3269500732421875, -0.31622314453125, -0.3054962158203125, -0.294769287109375, -0.2840423583984375, -0.2733154296875, -0.2625885009765625, -0.251861572265625, -0.2411346435546875, -0.23040771484375, -0.2196807861328125, -0.208953857421875, -0.1982269287109375, -0.1875, -0.1767730712890625, -0.166046142578125, -0.1553192138671875, -0.14459228515625, -0.1338653564453125, -0.123138427734375, -0.1124114990234375, -0.1016845703125, -0.0909576416015625, -0.080230712890625, -0.0695037841796875, -0.05877685546875, -0.0480499267578125, -0.037322998046875, -0.0265960693359375, -0.015869140625, -0.0051422119140625, 0.005584716796875, 0.0163116455078125, 0.02703857421875, 0.0377655029296875, 0.048492431640625, 0.0592193603515625, 0.0699462890625, 0.0806732177734375, 0.091400146484375, 0.1021270751953125, 0.11285400390625, 0.1235809326171875, 0.134307861328125, 0.1450347900390625, 0.15576171875, 0.1664886474609375, 0.177215576171875, 0.1879425048828125, 0.19866943359375, 0.2093963623046875, 0.220123291015625, 0.2308502197265625, 0.2415771484375, 0.2523040771484375, 0.263031005859375, 0.2737579345703125, 0.28448486328125, 0.2952117919921875, 0.305938720703125, 0.3166656494140625, 0.327392578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 13.0, 13.0, 12.0, 20.0, 25.0, 36.0, 31.0, 46.0, 45.0, 67.0, 67.0, 58.0, 67.0, 73.0, 60.0, 65.0, 41.0, 41.0, 38.0, 41.0, 21.0, 21.0, 17.0, 16.0, 16.0, 6.0, 10.0, 11.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011816024780273438, -0.0011403709650039673, -0.0010991394519805908, -0.0010579079389572144, -0.0010166764259338379, -0.0009754449129104614, -0.000934213399887085, -0.0008929818868637085, -0.000851750373840332, -0.0008105188608169556, -0.0007692873477935791, -0.0007280558347702026, -0.0006868243217468262, -0.0006455928087234497, -0.0006043612957000732, -0.0005631297826766968, -0.0005218982696533203, -0.00048066675662994385, -0.0004394352436065674, -0.0003982037305831909, -0.00035697221755981445, -0.000315740704536438, -0.0002745091915130615, -0.00023327767848968506, -0.0001920461654663086, -0.00015081465244293213, -0.00010958313941955566, -6.83516263961792e-05, -2.7120113372802734e-05, 1.411139965057373e-05, 5.5342912673950195e-05, 9.657442569732666e-05, 0.00013780593872070312, 0.0001790374517440796, 0.00022026896476745605, 0.0002615004777908325, 0.000302731990814209, 0.00034396350383758545, 0.0003851950168609619, 0.0004264265298843384, 0.00046765804290771484, 0.0005088895559310913, 0.0005501210689544678, 0.0005913525819778442, 0.0006325840950012207, 0.0006738156080245972, 0.0007150471210479736, 0.0007562786340713501, 0.0007975101470947266, 0.000838741660118103, 0.0008799731731414795, 0.000921204686164856, 0.0009624361991882324, 0.0010036677122116089, 0.0010448992252349854, 0.0010861307382583618, 0.0011273622512817383, 0.0011685937643051147, 0.0012098252773284912, 0.0012510567903518677, 0.0012922883033752441, 0.0013335198163986206, 0.001374751329421997, 0.0014159828424453735, 0.00145721435546875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 12.0, 10.0, 6.0, 14.0, 23.0, 31.0, 29.0, 40.0, 64.0, 73.0, 86.0, 115.0, 238.0, 566.0, 2644.0, 947660.0, 94929.0, 994.0, 374.0, 205.0, 131.0, 76.0, 54.0, 51.0, 35.0, 19.0, 19.0, 12.0, 12.0, 14.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0289764404296875, -0.02814316749572754, -0.027309894561767578, -0.026476621627807617, -0.025643348693847656, -0.024810075759887695, -0.023976802825927734, -0.023143529891967773, -0.022310256958007812, -0.02147698402404785, -0.02064371109008789, -0.01981043815612793, -0.01897716522216797, -0.018143892288208008, -0.017310619354248047, -0.016477346420288086, -0.015644073486328125, -0.014810800552368164, -0.013977527618408203, -0.013144254684448242, -0.012310981750488281, -0.01147770881652832, -0.01064443588256836, -0.009811162948608398, -0.008977890014648438, -0.008144617080688477, -0.007311344146728516, -0.006478071212768555, -0.005644798278808594, -0.004811525344848633, -0.003978252410888672, -0.003144979476928711, -0.00231170654296875, -0.001478433609008789, -0.0006451606750488281, 0.0001881122589111328, 0.0010213851928710938, 0.0018546581268310547, 0.0026879310607910156, 0.0035212039947509766, 0.0043544769287109375, 0.0051877498626708984, 0.006021022796630859, 0.00685429573059082, 0.007687568664550781, 0.008520841598510742, 0.009354114532470703, 0.010187387466430664, 0.011020660400390625, 0.011853933334350586, 0.012687206268310547, 0.013520479202270508, 0.014353752136230469, 0.01518702507019043, 0.01602029800415039, 0.01685357093811035, 0.017686843872070312, 0.018520116806030273, 0.019353389739990234, 0.020186662673950195, 0.021019935607910156, 0.021853208541870117, 0.022686481475830078, 0.02351975440979004, 0.02435302734375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 15.0, 159.0, 508.0, 291.0, 39.0, 4.0, 1.0], "bins": [-0.007772545330226421, -0.0076423571445047855, -0.00751216895878315, -0.007381980773061514, -0.007251792587339878, -0.007121603935956955, -0.006991415750235319, -0.006861227564513683, -0.0067310393787920475, -0.006600851193070412, -0.006470663007348776, -0.00634047482162714, -0.006210286170244217, -0.006080097984522581, -0.005949909798800945, -0.0058197216130793095, -0.005689533427357674, -0.005559345241636038, -0.005429157055914402, -0.005298968870192766, -0.00516878068447113, -0.005038592033088207, -0.004908403847366571, -0.004778215661644936, -0.0046480274759233, -0.004517839290201664, -0.004387651104480028, -0.004257462918758392, -0.004127274267375469, -0.003997086081653833, -0.0038668978959321976, -0.0037367097102105618, -0.0036065219901502132, -0.0034763338044285774, -0.0033461456187069416, -0.003215957200154662, -0.0030857690144330263, -0.0029555808287113905, -0.002825392410159111, -0.002695204224437475, -0.0025650160387158394, -0.0024348278529942036, -0.0023046396672725677, -0.0021744512487202883, -0.0020442630629986525, -0.0019140748772770166, -0.001783886575140059, -0.0016536982730031013, -0.0015235100872814655, -0.0013933219015598297, -0.001263133599422872, -0.0011329452972859144, -0.0010027571115642786, -0.0008725688676349819, -0.0007423806237056851, -0.0006121923797763884, -0.00048200407763943076, -0.00035181583371013403, -0.0002216275897808373, -9.143934585154057e-05, 3.8748898077756166e-05, 0.0001689371420070529, 0.00029912538593634963, 0.00042931362986564636, 0.0005595018737949431]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 6.0, 10.0, 5.0, 12.0, 16.0, 17.0, 15.0, 19.0, 22.0, 33.0, 19.0, 32.0, 34.0, 33.0, 25.0, 30.0, 41.0, 31.0, 37.0, 48.0, 30.0, 35.0, 30.0, 35.0, 36.0, 43.0, 42.0, 33.0, 26.0, 22.0, 24.0, 27.0, 18.0, 12.0, 16.0, 8.0, 11.0, 9.0, 11.0, 13.0, 4.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000517725944519043, -0.0005003409460186958, -0.0004829559475183487, -0.00046557094901800156, -0.0004481859505176544, -0.0004308009520173073, -0.00041341595351696014, -0.000396030955016613, -0.00037864595651626587, -0.00036126095801591873, -0.0003438759595155716, -0.00032649096101522446, -0.0003091059625148773, -0.0002917209640145302, -0.00027433596551418304, -0.0002569509670138359, -0.00023956596851348877, -0.00022218097001314163, -0.0002047959715127945, -0.00018741097301244736, -0.00017002597451210022, -0.00015264097601175308, -0.00013525597751140594, -0.00011787097901105881, -0.00010048598051071167, -8.310098201036453e-05, -6.57159835100174e-05, -4.833098500967026e-05, -3.094598650932312e-05, -1.3560988008975983e-05, 3.824010491371155e-06, 2.1209008991718292e-05, 3.859400749206543e-05, 5.597900599241257e-05, 7.33640044927597e-05, 9.074900299310684e-05, 0.00010813400149345398, 0.00012551899999380112, 0.00014290399849414825, 0.0001602889969944954, 0.00017767399549484253, 0.00019505899399518967, 0.0002124439924955368, 0.00022982899099588394, 0.0002472139894962311, 0.0002645989879965782, 0.00028198398649692535, 0.0002993689849972725, 0.00031675398349761963, 0.00033413898199796677, 0.0003515239804983139, 0.00036890897899866104, 0.0003862939774990082, 0.0004036789759993553, 0.00042106397449970245, 0.0004384489730000496, 0.00045583397150039673, 0.00047321897000074387, 0.000490603968501091, 0.0005079889670014381, 0.0005253739655017853, 0.0005427589640021324, 0.0005601439625024796, 0.0005775289610028267, 0.0005949139595031738]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 8.0, 10.0, 9.0, 9.0, 13.0, 18.0, 24.0, 19.0, 35.0, 25.0, 33.0, 37.0, 42.0, 37.0, 43.0, 48.0, 42.0, 47.0, 48.0, 60.0, 51.0, 56.0, 34.0, 49.0, 25.0, 28.0, 29.0, 23.0, 21.0, 15.0, 12.0, 9.0, 7.0, 10.0, 12.0, 8.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7679443359375, -5.551513671875, -5.3350830078125, -5.11865234375, -4.9022216796875, -4.685791015625, -4.4693603515625, -4.2529296875, -4.0364990234375, -3.820068359375, -3.6036376953125, -3.38720703125, -3.1707763671875, -2.954345703125, -2.7379150390625, -2.521484375, -2.3050537109375, -2.088623046875, -1.8721923828125, -1.65576171875, -1.4393310546875, -1.222900390625, -1.0064697265625, -0.7900390625, -0.5736083984375, -0.357177734375, -0.1407470703125, 0.07568359375, 0.2921142578125, 0.508544921875, 0.7249755859375, 0.94140625, 1.1578369140625, 1.374267578125, 1.5906982421875, 1.80712890625, 2.0235595703125, 2.239990234375, 2.4564208984375, 2.6728515625, 2.8892822265625, 3.105712890625, 3.3221435546875, 3.53857421875, 3.7550048828125, 3.971435546875, 4.1878662109375, 4.404296875, 4.6207275390625, 4.837158203125, 5.0535888671875, 5.27001953125, 5.4864501953125, 5.702880859375, 5.9193115234375, 6.1357421875, 6.3521728515625, 6.568603515625, 6.7850341796875, 7.00146484375, 7.2178955078125, 7.434326171875, 7.6507568359375, 7.8671875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 13.0, 10.0, 21.0, 32.0, 39.0, 75.0, 116.0, 169.0, 353.0, 611.0, 1292.0, 3405.0, 9194.0, 28635.0, 94740.0, 306959.0, 405852.0, 135334.0, 40707.0, 12989.0, 4509.0, 1754.0, 729.0, 408.0, 226.0, 126.0, 79.0, 61.0, 34.0, 32.0, 13.0, 7.0, 13.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5546875, -8.296630859375, -8.03857421875, -7.780517578125, -7.5224609375, -7.264404296875, -7.00634765625, -6.748291015625, -6.490234375, -6.232177734375, -5.97412109375, -5.716064453125, -5.4580078125, -5.199951171875, -4.94189453125, -4.683837890625, -4.42578125, -4.167724609375, -3.90966796875, -3.651611328125, -3.3935546875, -3.135498046875, -2.87744140625, -2.619384765625, -2.361328125, -2.103271484375, -1.84521484375, -1.587158203125, -1.3291015625, -1.071044921875, -0.81298828125, -0.554931640625, -0.296875, -0.038818359375, 0.21923828125, 0.477294921875, 0.7353515625, 0.993408203125, 1.25146484375, 1.509521484375, 1.767578125, 2.025634765625, 2.28369140625, 2.541748046875, 2.7998046875, 3.057861328125, 3.31591796875, 3.573974609375, 3.83203125, 4.090087890625, 4.34814453125, 4.606201171875, 4.8642578125, 5.122314453125, 5.38037109375, 5.638427734375, 5.896484375, 6.154541015625, 6.41259765625, 6.670654296875, 6.9287109375, 7.186767578125, 7.44482421875, 7.702880859375, 7.9609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 6.0, 11.0, 5.0, 10.0, 18.0, 20.0, 23.0, 19.0, 29.0, 25.0, 27.0, 27.0, 39.0, 53.0, 43.0, 51.0, 84.0, 192.0, 1447.0, 310.0, 140.0, 65.0, 62.0, 45.0, 41.0, 36.0, 46.0, 37.0, 24.0, 15.0, 23.0, 13.0, 5.0, 11.0, 8.0, 18.0, 2.0, 9.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -20.279296875, -19.62109375, -18.962890625, -18.3046875, -17.646484375, -16.98828125, -16.330078125, -15.671875, -15.013671875, -14.35546875, -13.697265625, -13.0390625, -12.380859375, -11.72265625, -11.064453125, -10.40625, -9.748046875, -9.08984375, -8.431640625, -7.7734375, -7.115234375, -6.45703125, -5.798828125, -5.140625, -4.482421875, -3.82421875, -3.166015625, -2.5078125, -1.849609375, -1.19140625, -0.533203125, 0.125, 0.783203125, 1.44140625, 2.099609375, 2.7578125, 3.416015625, 4.07421875, 4.732421875, 5.390625, 6.048828125, 6.70703125, 7.365234375, 8.0234375, 8.681640625, 9.33984375, 9.998046875, 10.65625, 11.314453125, 11.97265625, 12.630859375, 13.2890625, 13.947265625, 14.60546875, 15.263671875, 15.921875, 16.580078125, 17.23828125, 17.896484375, 18.5546875, 19.212890625, 19.87109375, 20.529296875, 21.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 11.0, 28.0, 23.0, 46.0, 65.0, 83.0, 111.0, 215.0, 420.0, 1224.0, 36865.0, 3101728.0, 3465.0, 642.0, 257.0, 182.0, 102.0, 69.0, 53.0, 23.0, 22.0, 17.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-122.6875, -119.3935546875, -116.099609375, -112.8056640625, -109.51171875, -106.2177734375, -102.923828125, -99.6298828125, -96.3359375, -93.0419921875, -89.748046875, -86.4541015625, -83.16015625, -79.8662109375, -76.572265625, -73.2783203125, -69.984375, -66.6904296875, -63.396484375, -60.1025390625, -56.80859375, -53.5146484375, -50.220703125, -46.9267578125, -43.6328125, -40.3388671875, -37.044921875, -33.7509765625, -30.45703125, -27.1630859375, -23.869140625, -20.5751953125, -17.28125, -13.9873046875, -10.693359375, -7.3994140625, -4.10546875, -0.8115234375, 2.482421875, 5.7763671875, 9.0703125, 12.3642578125, 15.658203125, 18.9521484375, 22.24609375, 25.5400390625, 28.833984375, 32.1279296875, 35.421875, 38.7158203125, 42.009765625, 45.3037109375, 48.59765625, 51.8916015625, 55.185546875, 58.4794921875, 61.7734375, 65.0673828125, 68.361328125, 71.6552734375, 74.94921875, 78.2431640625, 81.537109375, 84.8310546875, 88.125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 17.0, 31.0, 39.0, 51.0, 88.0, 108.0, 129.0, 130.0, 99.0, 107.0, 70.0, 66.0, 27.0, 20.0, 6.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.224462509155273, -24.33256721496582, -23.440671920776367, -22.548778533935547, -21.656883239746094, -20.76498794555664, -19.873092651367188, -18.981197357177734, -18.08930206298828, -17.197406768798828, -16.305511474609375, -15.413617134094238, -14.521722793579102, -13.629827499389648, -12.737932205200195, -11.846036911010742, -10.954143524169922, -10.062248229980469, -9.170353889465332, -8.278458595275879, -7.386563777923584, -6.494668960571289, -5.602773666381836, -4.710878849029541, -3.818984031677246, -2.927089214324951, -2.035194158554077, -1.1432991027832031, -0.2514042854309082, 0.6404905319213867, 1.5323858261108398, 2.4242806434631348, 3.316173553466797, 4.208068370819092, 5.099963188171387, 5.99185848236084, 6.883753299713135, 7.77564811706543, 8.667543411254883, 9.559438705444336, 10.451333045959473, 11.343228340148926, 12.235122680664062, 13.127017974853516, 14.018913269042969, 14.910807609558105, 15.802702903747559, 16.694597244262695, 17.58649253845215, 18.4783878326416, 19.370283126831055, 20.262176513671875, 21.154071807861328, 22.04596710205078, 22.937862396240234, 23.829757690429688, 24.72165298461914, 25.613548278808594, 26.505443572998047, 27.3973388671875, 28.28923225402832, 29.181127548217773, 30.073022842407227, 30.96491813659668, 31.8568115234375]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 8.0, 10.0, 7.0, 10.0, 9.0, 13.0, 20.0, 17.0, 22.0, 15.0, 26.0, 22.0, 27.0, 44.0, 26.0, 42.0, 35.0, 38.0, 46.0, 28.0, 33.0, 51.0, 51.0, 30.0, 31.0, 44.0, 34.0, 25.0, 21.0, 28.0, 26.0, 24.0, 19.0, 21.0, 18.0, 19.0, 11.0, 9.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-43.384952545166016, -41.89735794067383, -40.40976333618164, -38.92216873168945, -37.434574127197266, -35.94697952270508, -34.45938491821289, -32.9717903137207, -31.484195709228516, -29.996601104736328, -28.50900650024414, -27.021411895751953, -25.533817291259766, -24.046222686767578, -22.55862808227539, -21.071033477783203, -19.583438873291016, -18.095844268798828, -16.60824966430664, -15.120655059814453, -13.633060455322266, -12.145465850830078, -10.65787124633789, -9.170276641845703, -7.682682037353516, -6.195087432861328, -4.707492828369141, -3.219898223876953, -1.7323036193847656, -0.24470901489257812, 1.2428855895996094, 2.730480194091797, 4.218074798583984, 5.705669403076172, 7.193264007568359, 8.680858612060547, 10.168453216552734, 11.656047821044922, 13.14364242553711, 14.631237030029297, 16.118831634521484, 17.606426239013672, 19.09402084350586, 20.581615447998047, 22.069210052490234, 23.556804656982422, 25.04439926147461, 26.531993865966797, 28.019588470458984, 29.507183074951172, 30.99477767944336, 32.48237228393555, 33.969966888427734, 35.45756149291992, 36.94515609741211, 38.4327507019043, 39.920345306396484, 41.40793991088867, 42.89553451538086, 44.38312911987305, 45.870723724365234, 47.35831832885742, 48.84591293334961, 50.3335075378418, 51.821102142333984]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 12.0, 10.0, 13.0, 22.0, 14.0, 19.0, 25.0, 29.0, 34.0, 41.0, 32.0, 30.0, 48.0, 33.0, 47.0, 51.0, 62.0, 58.0, 50.0, 42.0, 50.0, 34.0, 49.0, 31.0, 28.0, 28.0, 16.0, 19.0, 14.0, 11.0, 13.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.223388671875, -5.98583984375, -5.748291015625, -5.5107421875, -5.273193359375, -5.03564453125, -4.798095703125, -4.560546875, -4.322998046875, -4.08544921875, -3.847900390625, -3.6103515625, -3.372802734375, -3.13525390625, -2.897705078125, -2.66015625, -2.422607421875, -2.18505859375, -1.947509765625, -1.7099609375, -1.472412109375, -1.23486328125, -0.997314453125, -0.759765625, -0.522216796875, -0.28466796875, -0.047119140625, 0.1904296875, 0.427978515625, 0.66552734375, 0.903076171875, 1.140625, 1.378173828125, 1.61572265625, 1.853271484375, 2.0908203125, 2.328369140625, 2.56591796875, 2.803466796875, 3.041015625, 3.278564453125, 3.51611328125, 3.753662109375, 3.9912109375, 4.228759765625, 4.46630859375, 4.703857421875, 4.94140625, 5.178955078125, 5.41650390625, 5.654052734375, 5.8916015625, 6.129150390625, 6.36669921875, 6.604248046875, 6.841796875, 7.079345703125, 7.31689453125, 7.554443359375, 7.7919921875, 8.029541015625, 8.26708984375, 8.504638671875, 8.7421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 15.0, 10.0, 17.0, 22.0, 42.0, 39.0, 40.0, 45.0, 71.0, 81.0, 124.0, 167.0, 373.0, 977.0, 4206.0, 36560.0, 486669.0, 2438500.0, 1118283.0, 96809.0, 8442.0, 1478.0, 470.0, 250.0, 148.0, 85.0, 78.0, 47.0, 38.0, 35.0, 20.0, 30.0, 22.0, 17.0, 14.0, 8.0, 13.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.328125, -12.863525390625, -12.39892578125, -11.934326171875, -11.4697265625, -11.005126953125, -10.54052734375, -10.075927734375, -9.611328125, -9.146728515625, -8.68212890625, -8.217529296875, -7.7529296875, -7.288330078125, -6.82373046875, -6.359130859375, -5.89453125, -5.429931640625, -4.96533203125, -4.500732421875, -4.0361328125, -3.571533203125, -3.10693359375, -2.642333984375, -2.177734375, -1.713134765625, -1.24853515625, -0.783935546875, -0.3193359375, 0.145263671875, 0.60986328125, 1.074462890625, 1.5390625, 2.003662109375, 2.46826171875, 2.932861328125, 3.3974609375, 3.862060546875, 4.32666015625, 4.791259765625, 5.255859375, 5.720458984375, 6.18505859375, 6.649658203125, 7.1142578125, 7.578857421875, 8.04345703125, 8.508056640625, 8.97265625, 9.437255859375, 9.90185546875, 10.366455078125, 10.8310546875, 11.295654296875, 11.76025390625, 12.224853515625, 12.689453125, 13.154052734375, 13.61865234375, 14.083251953125, 14.5478515625, 15.012451171875, 15.47705078125, 15.941650390625, 16.40625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 12.0, 13.0, 17.0, 38.0, 38.0, 43.0, 65.0, 77.0, 143.0, 179.0, 294.0, 365.0, 484.0, 523.0, 462.0, 413.0, 269.0, 210.0, 128.0, 72.0, 52.0, 47.0, 38.0, 20.0, 21.0, 15.0, 6.0, 8.0, 6.0, 5.0, 6.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.546875, -12.09130859375, -11.6357421875, -11.18017578125, -10.724609375, -10.26904296875, -9.8134765625, -9.35791015625, -8.90234375, -8.44677734375, -7.9912109375, -7.53564453125, -7.080078125, -6.62451171875, -6.1689453125, -5.71337890625, -5.2578125, -4.80224609375, -4.3466796875, -3.89111328125, -3.435546875, -2.97998046875, -2.5244140625, -2.06884765625, -1.61328125, -1.15771484375, -0.7021484375, -0.24658203125, 0.208984375, 0.66455078125, 1.1201171875, 1.57568359375, 2.03125, 2.48681640625, 2.9423828125, 3.39794921875, 3.853515625, 4.30908203125, 4.7646484375, 5.22021484375, 5.67578125, 6.13134765625, 6.5869140625, 7.04248046875, 7.498046875, 7.95361328125, 8.4091796875, 8.86474609375, 9.3203125, 9.77587890625, 10.2314453125, 10.68701171875, 11.142578125, 11.59814453125, 12.0537109375, 12.50927734375, 12.96484375, 13.42041015625, 13.8759765625, 14.33154296875, 14.787109375, 15.24267578125, 15.6982421875, 16.15380859375, 16.609375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 5.0, 4.0, 8.0, 9.0, 12.0, 11.0, 28.0, 40.0, 50.0, 51.0, 93.0, 137.0, 245.0, 381.0, 825.0, 45158.0, 4115479.0, 29888.0, 745.0, 393.0, 249.0, 154.0, 81.0, 67.0, 45.0, 45.0, 27.0, 17.0, 15.0, 6.0, 10.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.6484375, -74.546875, -72.4453125, -70.34375, -68.2421875, -66.140625, -64.0390625, -61.9375, -59.8359375, -57.734375, -55.6328125, -53.53125, -51.4296875, -49.328125, -47.2265625, -45.125, -43.0234375, -40.921875, -38.8203125, -36.71875, -34.6171875, -32.515625, -30.4140625, -28.3125, -26.2109375, -24.109375, -22.0078125, -19.90625, -17.8046875, -15.703125, -13.6015625, -11.5, -9.3984375, -7.296875, -5.1953125, -3.09375, -0.9921875, 1.109375, 3.2109375, 5.3125, 7.4140625, 9.515625, 11.6171875, 13.71875, 15.8203125, 17.921875, 20.0234375, 22.125, 24.2265625, 26.328125, 28.4296875, 30.53125, 32.6328125, 34.734375, 36.8359375, 38.9375, 41.0390625, 43.140625, 45.2421875, 47.34375, 49.4453125, 51.546875, 53.6484375, 55.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 15.0, 107.0, 355.0, 382.0, 135.0, 21.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.03279876708984, -76.68462371826172, -70.33644104003906, -63.98826599121094, -57.64009094238281, -51.29191589355469, -44.9437370300293, -38.595558166503906, -32.24738311767578, -25.899206161499023, -19.551029205322266, -13.202852249145508, -6.85467529296875, -0.5064983367919922, 5.841678619384766, 12.189857482910156, 18.53803253173828, 24.88620948791504, 31.234386444091797, 37.58256530761719, 43.93074035644531, 50.27891540527344, 56.62709426879883, 62.97527313232422, 69.32344818115234, 75.67162322998047, 82.01980590820312, 88.36798095703125, 94.71615600585938, 101.0643310546875, 107.41250610351562, 113.76068878173828, 120.10885620117188, 126.45703125, 132.80520629882812, 139.15338134765625, 145.50155639648438, 151.84974670410156, 158.1979217529297, 164.5460968017578, 170.89427185058594, 177.24244689941406, 183.5906219482422, 189.9387969970703, 196.2869873046875, 202.63516235351562, 208.98333740234375, 215.33151245117188, 221.6796875, 228.02786254882812, 234.37603759765625, 240.72421264648438, 247.0723876953125, 253.4205780029297, 259.76873779296875, 266.116943359375, 272.465087890625, 278.8132629394531, 285.16143798828125, 291.5096130371094, 297.8577880859375, 304.2059631347656, 310.55413818359375, 316.90234375, 323.2505187988281]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 8.0, 9.0, 9.0, 8.0, 10.0, 18.0, 23.0, 26.0, 23.0, 31.0, 22.0, 35.0, 38.0, 32.0, 38.0, 42.0, 28.0, 42.0, 34.0, 49.0, 38.0, 46.0, 30.0, 36.0, 39.0, 32.0, 32.0, 28.0, 25.0, 22.0, 31.0, 13.0, 20.0, 10.0, 13.0, 10.0, 11.0, 7.0, 2.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.16272735595703, -31.94219970703125, -30.721670150756836, -29.501142501831055, -28.280614852905273, -27.06008529663086, -25.839557647705078, -24.619029998779297, -23.398502349853516, -22.177974700927734, -20.95744514465332, -19.73691749572754, -18.516389846801758, -17.295860290527344, -16.075332641601562, -14.854804992675781, -13.634275436401367, -12.41374683380127, -11.193219184875488, -9.97269058227539, -8.75216293334961, -7.531634330749512, -6.311105728149414, -5.090578079223633, -3.870049476623535, -2.6495213508605957, -1.4289929866790771, -0.2084646224975586, 1.0120635032653809, 2.2325916290283203, 3.453120231628418, 4.673647880554199, 5.894176483154297, 7.114704608917236, 8.335232734680176, 9.555761337280273, 10.776288986206055, 11.996817588806152, 13.21734619140625, 14.437873840332031, 15.658402442932129, 16.878931045532227, 18.099458694458008, 19.319988250732422, 20.540515899658203, 21.761043548583984, 22.981571197509766, 24.202098846435547, 25.42262840270996, 26.643156051635742, 27.863685607910156, 29.084213256835938, 30.30474090576172, 31.5252685546875, 32.74579620361328, 33.96632385253906, 35.18685531616211, 36.40738296508789, 37.62791061401367, 38.84844207763672, 40.0689697265625, 41.28949737548828, 42.51002502441406, 43.730552673339844, 44.951080322265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 7.0, 9.0, 10.0, 8.0, 11.0, 16.0, 20.0, 23.0, 22.0, 42.0, 27.0, 36.0, 51.0, 47.0, 40.0, 44.0, 44.0, 59.0, 42.0, 44.0, 43.0, 41.0, 30.0, 57.0, 31.0, 23.0, 27.0, 24.0, 19.0, 18.0, 18.0, 13.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33984375, -6.1270751953125, -5.914306640625, -5.7015380859375, -5.48876953125, -5.2760009765625, -5.063232421875, -4.8504638671875, -4.6376953125, -4.4249267578125, -4.212158203125, -3.9993896484375, -3.78662109375, -3.5738525390625, -3.361083984375, -3.1483154296875, -2.935546875, -2.7227783203125, -2.510009765625, -2.2972412109375, -2.08447265625, -1.8717041015625, -1.658935546875, -1.4461669921875, -1.2333984375, -1.0206298828125, -0.807861328125, -0.5950927734375, -0.38232421875, -0.1695556640625, 0.043212890625, 0.2559814453125, 0.46875, 0.6815185546875, 0.894287109375, 1.1070556640625, 1.31982421875, 1.5325927734375, 1.745361328125, 1.9581298828125, 2.1708984375, 2.3836669921875, 2.596435546875, 2.8092041015625, 3.02197265625, 3.2347412109375, 3.447509765625, 3.6602783203125, 3.873046875, 4.0858154296875, 4.298583984375, 4.5113525390625, 4.72412109375, 4.9368896484375, 5.149658203125, 5.3624267578125, 5.5751953125, 5.7879638671875, 6.000732421875, 6.2135009765625, 6.42626953125, 6.6390380859375, 6.851806640625, 7.0645751953125, 7.27734375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 8.0, 7.0, 6.0, 11.0, 20.0, 27.0, 34.0, 50.0, 96.0, 125.0, 152.0, 235.0, 320.0, 454.0, 667.0, 993.0, 1514.0, 2129.0, 3085.0, 4600.0, 6753.0, 10237.0, 15179.0, 22716.0, 34503.0, 53355.0, 83043.0, 128209.0, 177811.0, 168302.0, 116096.0, 74945.0, 48178.0, 31375.0, 20674.0, 13846.0, 9463.0, 6175.0, 4092.0, 2803.0, 1912.0, 1374.0, 954.0, 600.0, 419.0, 300.0, 206.0, 140.0, 110.0, 76.0, 58.0, 45.0, 20.0, 14.0, 21.0, 13.0, 1.0, 9.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.40185546875, -0.3888435363769531, -0.37583160400390625, -0.3628196716308594, -0.3498077392578125, -0.3367958068847656, -0.32378387451171875, -0.3107719421386719, -0.297760009765625, -0.2847480773925781, -0.27173614501953125, -0.2587242126464844, -0.2457122802734375, -0.23270034790039062, -0.21968841552734375, -0.20667648315429688, -0.19366455078125, -0.18065261840820312, -0.16764068603515625, -0.15462875366210938, -0.1416168212890625, -0.12860488891601562, -0.11559295654296875, -0.10258102416992188, -0.089569091796875, -0.07655715942382812, -0.06354522705078125, -0.050533294677734375, -0.0375213623046875, -0.024509429931640625, -0.01149749755859375, 0.001514434814453125, 0.0145263671875, 0.027538299560546875, 0.04055023193359375, 0.053562164306640625, 0.0665740966796875, 0.07958602905273438, 0.09259796142578125, 0.10560989379882812, 0.118621826171875, 0.13163375854492188, 0.14464569091796875, 0.15765762329101562, 0.1706695556640625, 0.18368148803710938, 0.19669342041015625, 0.20970535278320312, 0.22271728515625, 0.23572921752929688, 0.24874114990234375, 0.2617530822753906, 0.2747650146484375, 0.2877769470214844, 0.30078887939453125, 0.3138008117675781, 0.326812744140625, 0.3398246765136719, 0.35283660888671875, 0.3658485412597656, 0.3788604736328125, 0.3918724060058594, 0.40488433837890625, 0.4178962707519531, 0.430908203125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 12.0, 7.0, 12.0, 10.0, 10.0, 8.0, 14.0, 16.0, 20.0, 29.0, 18.0, 26.0, 21.0, 44.0, 35.0, 41.0, 38.0, 42.0, 39.0, 1066.0, 38.0, 41.0, 35.0, 34.0, 43.0, 37.0, 25.0, 41.0, 29.0, 30.0, 26.0, 22.0, 20.0, 21.0, 15.0, 8.0, 11.0, 5.0, 7.0, 2.0, 2.0, 2.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.47332763671875, -3.3529052734375, -3.23248291015625, -3.112060546875, -2.99163818359375, -2.8712158203125, -2.75079345703125, -2.63037109375, -2.50994873046875, -2.3895263671875, -2.26910400390625, -2.148681640625, -2.02825927734375, -1.9078369140625, -1.78741455078125, -1.6669921875, -1.54656982421875, -1.4261474609375, -1.30572509765625, -1.185302734375, -1.06488037109375, -0.9444580078125, -0.82403564453125, -0.70361328125, -0.58319091796875, -0.4627685546875, -0.34234619140625, -0.221923828125, -0.10150146484375, 0.0189208984375, 0.13934326171875, 0.259765625, 0.38018798828125, 0.5006103515625, 0.62103271484375, 0.741455078125, 0.86187744140625, 0.9822998046875, 1.10272216796875, 1.22314453125, 1.34356689453125, 1.4639892578125, 1.58441162109375, 1.704833984375, 1.82525634765625, 1.9456787109375, 2.06610107421875, 2.1865234375, 2.30694580078125, 2.4273681640625, 2.54779052734375, 2.668212890625, 2.78863525390625, 2.9090576171875, 3.02947998046875, 3.14990234375, 3.27032470703125, 3.3907470703125, 3.51116943359375, 3.631591796875, 3.75201416015625, 3.8724365234375, 3.99285888671875, 4.11328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 15.0, 11.0, 12.0, 17.0, 35.0, 52.0, 93.0, 117.0, 158.0, 239.0, 314.0, 493.0, 727.0, 1028.0, 1400.0, 2124.0, 2934.0, 4316.0, 6134.0, 8946.0, 12722.0, 17912.0, 26065.0, 37977.0, 55498.0, 80954.0, 114855.0, 440824.0, 901668.0, 116469.0, 81699.0, 55875.0, 38222.0, 26399.0, 18523.0, 12599.0, 8839.0, 6369.0, 4433.0, 3096.0, 2166.0, 1509.0, 1038.0, 682.0, 492.0, 366.0, 229.0, 152.0, 112.0, 65.0, 50.0, 38.0, 29.0, 16.0, 18.0, 5.0, 2.0, 4.0, 3.0, 2.0], "bins": [-0.323486328125, -0.3133811950683594, -0.30327606201171875, -0.2931709289550781, -0.2830657958984375, -0.2729606628417969, -0.26285552978515625, -0.2527503967285156, -0.242645263671875, -0.23254013061523438, -0.22243499755859375, -0.21232986450195312, -0.2022247314453125, -0.19211959838867188, -0.18201446533203125, -0.17190933227539062, -0.16180419921875, -0.15169906616210938, -0.14159393310546875, -0.13148880004882812, -0.1213836669921875, -0.11127853393554688, -0.10117340087890625, -0.09106826782226562, -0.080963134765625, -0.07085800170898438, -0.06075286865234375, -0.050647735595703125, -0.0405426025390625, -0.030437469482421875, -0.02033233642578125, -0.010227203369140625, -0.0001220703125, 0.009983062744140625, 0.02008819580078125, 0.030193328857421875, 0.0402984619140625, 0.050403594970703125, 0.06050872802734375, 0.07061386108398438, 0.080718994140625, 0.09082412719726562, 0.10092926025390625, 0.11103439331054688, 0.1211395263671875, 0.13124465942382812, 0.14134979248046875, 0.15145492553710938, 0.16156005859375, 0.17166519165039062, 0.18177032470703125, 0.19187545776367188, 0.2019805908203125, 0.21208572387695312, 0.22219085693359375, 0.23229598999023438, 0.242401123046875, 0.2525062561035156, 0.26261138916015625, 0.2727165222167969, 0.2828216552734375, 0.2929267883300781, 0.30303192138671875, 0.3131370544433594, 0.3232421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 12.0, 6.0, 7.0, 18.0, 19.0, 22.0, 30.0, 29.0, 43.0, 52.0, 51.0, 57.0, 60.0, 54.0, 56.0, 50.0, 62.0, 52.0, 44.0, 47.0, 34.0, 33.0, 36.0, 20.0, 13.0, 14.0, 14.0, 8.0, 8.0, 5.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001148223876953125, -0.001107737421989441, -0.0010672509670257568, -0.0010267645120620728, -0.0009862780570983887, -0.0009457916021347046, -0.0009053051471710205, -0.0008648186922073364, -0.0008243322372436523, -0.0007838457822799683, -0.0007433593273162842, -0.0007028728723526001, -0.000662386417388916, -0.0006218999624252319, -0.0005814135074615479, -0.0005409270524978638, -0.0005004405975341797, -0.0004599541425704956, -0.0004194676876068115, -0.00037898123264312744, -0.00033849477767944336, -0.0002980083227157593, -0.0002575218677520752, -0.0002170354127883911, -0.00017654895782470703, -0.00013606250286102295, -9.557604789733887e-05, -5.5089592933654785e-05, -1.4603137969970703e-05, 2.588331699371338e-05, 6.636977195739746e-05, 0.00010685622692108154, 0.00014734268188476562, 0.0001878291368484497, 0.0002283155918121338, 0.00026880204677581787, 0.00030928850173950195, 0.00034977495670318604, 0.0003902614116668701, 0.0004307478666305542, 0.0004712343215942383, 0.0005117207765579224, 0.0005522072315216064, 0.0005926936864852905, 0.0006331801414489746, 0.0006736665964126587, 0.0007141530513763428, 0.0007546395063400269, 0.0007951259613037109, 0.000835612416267395, 0.0008760988712310791, 0.0009165853261947632, 0.0009570717811584473, 0.0009975582361221313, 0.0010380446910858154, 0.0010785311460494995, 0.0011190176010131836, 0.0011595040559768677, 0.0011999905109405518, 0.0012404769659042358, 0.00128096342086792, 0.001321449875831604, 0.001361936330795288, 0.0014024227857589722, 0.0014429092407226562]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 8.0, 8.0, 10.0, 19.0, 24.0, 31.0, 34.0, 56.0, 57.0, 98.0, 130.0, 204.0, 427.0, 1436.0, 422944.0, 620195.0, 1668.0, 435.0, 220.0, 145.0, 93.0, 56.0, 49.0, 39.0, 35.0, 28.0, 15.0, 10.0, 11.0, 12.0, 10.0, 6.0, 4.0, 3.0, 6.0, 0.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.032379150390625, -0.03150486946105957, -0.03063058853149414, -0.02975630760192871, -0.02888202667236328, -0.02800774574279785, -0.027133464813232422, -0.026259183883666992, -0.025384902954101562, -0.024510622024536133, -0.023636341094970703, -0.022762060165405273, -0.021887779235839844, -0.021013498306274414, -0.020139217376708984, -0.019264936447143555, -0.018390655517578125, -0.017516374588012695, -0.016642093658447266, -0.015767812728881836, -0.014893531799316406, -0.014019250869750977, -0.013144969940185547, -0.012270689010620117, -0.011396408081054688, -0.010522127151489258, -0.009647846221923828, -0.008773565292358398, -0.007899284362792969, -0.007025003433227539, -0.006150722503662109, -0.00527644157409668, -0.00440216064453125, -0.0035278797149658203, -0.0026535987854003906, -0.001779317855834961, -0.0009050369262695312, -3.075599670410156e-05, 0.0008435249328613281, 0.0017178058624267578, 0.0025920867919921875, 0.003466367721557617, 0.004340648651123047, 0.0052149295806884766, 0.006089210510253906, 0.006963491439819336, 0.007837772369384766, 0.008712053298950195, 0.009586334228515625, 0.010460615158081055, 0.011334896087646484, 0.012209177017211914, 0.013083457946777344, 0.013957738876342773, 0.014832019805908203, 0.015706300735473633, 0.016580581665039062, 0.017454862594604492, 0.018329143524169922, 0.01920342445373535, 0.02007770538330078, 0.02095198631286621, 0.02182626724243164, 0.02270054817199707, 0.0235748291015625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 356.0, 661.0], "bins": [-0.0279895830899477, -0.02754577435553074, -0.027101963758468628, -0.026658155024051666, -0.026214346289634705, -0.025770535692572594, -0.025326726958155632, -0.02488291636109352, -0.02443910762667656, -0.023995298892259598, -0.023551488295197487, -0.023107679560780525, -0.022663868963718414, -0.022220060229301453, -0.02177625149488449, -0.02133244089782238, -0.02088863216340542, -0.020444823428988457, -0.020001012831926346, -0.019557204097509384, -0.019113395363092422, -0.01866958476603031, -0.01822577603161335, -0.01778196543455124, -0.017338156700134277, -0.016894347965717316, -0.016450537368655205, -0.016006728634238243, -0.015562918968498707, -0.01511910930275917, -0.014675300568342209, -0.014231490902602673, -0.013787681236863136, -0.0133438715711236, -0.012900061905384064, -0.012456253170967102, -0.012012443505227566, -0.01156863383948803, -0.011124825105071068, -0.010681015439331532, -0.010237205773591995, -0.009793396107852459, -0.009349586442112923, -0.008905777707695961, -0.008461968041956425, -0.008018158376216888, -0.0075743491761386395, -0.0071305399760603905, -0.006686730310320854, -0.006242920644581318, -0.005799111444503069, -0.00535530224442482, -0.004911492578685284, -0.004467682912945747, -0.004023873712867498, -0.0035800642799586058, -0.003136254847049713, -0.0026924454141408205, -0.002248635981231928, -0.0018048265483230352, -0.0013610171154141426, -0.00091720768250525, -0.00047339824959635735, -2.9588816687464714e-05, 0.0004142206453252584]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 5.0, 12.0, 13.0, 25.0, 20.0, 25.0, 34.0, 31.0, 42.0, 56.0, 57.0, 55.0, 47.0, 60.0, 64.0, 60.0, 50.0, 36.0, 45.0, 37.0, 42.0, 27.0, 39.0, 33.0, 12.0, 16.0, 16.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005998015403747559, -0.0005710385739803314, -0.000542275607585907, -0.0005135126411914825, -0.0004847496747970581, -0.00045598670840263367, -0.00042722374200820923, -0.0003984607756137848, -0.00036969780921936035, -0.0003409348428249359, -0.0003121718764305115, -0.00028340891003608704, -0.0002546459436416626, -0.00022588297724723816, -0.00019712001085281372, -0.00016835704445838928, -0.00013959407806396484, -0.0001108311116695404, -8.206814527511597e-05, -5.330517888069153e-05, -2.454221248626709e-05, 4.220753908157349e-06, 3.298372030258179e-05, 6.174668669700623e-05, 9.050965309143066e-05, 0.0001192726194858551, 0.00014803558588027954, 0.00017679855227470398, 0.00020556151866912842, 0.00023432448506355286, 0.0002630874514579773, 0.00029185041785240173, 0.00032061338424682617, 0.0003493763506412506, 0.00037813931703567505, 0.0004069022834300995, 0.0004356652498245239, 0.00046442821621894836, 0.0004931911826133728, 0.0005219541490077972, 0.0005507171154022217, 0.0005794800817966461, 0.0006082430481910706, 0.000637006014585495, 0.0006657689809799194, 0.0006945319473743439, 0.0007232949137687683, 0.0007520578801631927, 0.0007808208465576172, 0.0008095838129520416, 0.0008383467793464661, 0.0008671097457408905, 0.0008958727121353149, 0.0009246356785297394, 0.0009533986449241638, 0.0009821616113185883, 0.0010109245777130127, 0.0010396875441074371, 0.0010684505105018616, 0.001097213476896286, 0.0011259764432907104, 0.0011547394096851349, 0.0011835023760795593, 0.0012122653424739838, 0.0012410283088684082]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 7.0, 9.0, 10.0, 8.0, 11.0, 16.0, 20.0, 23.0, 22.0, 42.0, 27.0, 36.0, 51.0, 47.0, 40.0, 44.0, 44.0, 59.0, 42.0, 44.0, 43.0, 41.0, 30.0, 57.0, 31.0, 23.0, 27.0, 24.0, 19.0, 18.0, 18.0, 13.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33984375, -6.1270751953125, -5.914306640625, -5.7015380859375, -5.48876953125, -5.2760009765625, -5.063232421875, -4.8504638671875, -4.6376953125, -4.4249267578125, -4.212158203125, -3.9993896484375, -3.78662109375, -3.5738525390625, -3.361083984375, -3.1483154296875, -2.935546875, -2.7227783203125, -2.510009765625, -2.2972412109375, -2.08447265625, -1.8717041015625, -1.658935546875, -1.4461669921875, -1.2333984375, -1.0206298828125, -0.807861328125, -0.5950927734375, -0.38232421875, -0.1695556640625, 0.043212890625, 0.2559814453125, 0.46875, 0.6815185546875, 0.894287109375, 1.1070556640625, 1.31982421875, 1.5325927734375, 1.745361328125, 1.9581298828125, 2.1708984375, 2.3836669921875, 2.596435546875, 2.8092041015625, 3.02197265625, 3.2347412109375, 3.447509765625, 3.6602783203125, 3.873046875, 4.0858154296875, 4.298583984375, 4.5113525390625, 4.72412109375, 4.9368896484375, 5.149658203125, 5.3624267578125, 5.5751953125, 5.7879638671875, 6.000732421875, 6.2135009765625, 6.42626953125, 6.6390380859375, 6.851806640625, 7.0645751953125, 7.27734375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 11.0, 11.0, 14.0, 22.0, 39.0, 40.0, 60.0, 91.0, 137.0, 254.0, 482.0, 991.0, 2105.0, 4293.0, 8760.0, 18017.0, 39115.0, 98200.0, 263284.0, 354660.0, 152265.0, 57362.0, 24824.0, 11880.0, 5794.0, 2839.0, 1399.0, 684.0, 364.0, 188.0, 112.0, 74.0, 51.0, 29.0, 32.0, 19.0, 11.0, 12.0, 9.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.2890625, -6.0809326171875, -5.872802734375, -5.6646728515625, -5.45654296875, -5.2484130859375, -5.040283203125, -4.8321533203125, -4.6240234375, -4.4158935546875, -4.207763671875, -3.9996337890625, -3.79150390625, -3.5833740234375, -3.375244140625, -3.1671142578125, -2.958984375, -2.7508544921875, -2.542724609375, -2.3345947265625, -2.12646484375, -1.9183349609375, -1.710205078125, -1.5020751953125, -1.2939453125, -1.0858154296875, -0.877685546875, -0.6695556640625, -0.46142578125, -0.2532958984375, -0.045166015625, 0.1629638671875, 0.37109375, 0.5792236328125, 0.787353515625, 0.9954833984375, 1.20361328125, 1.4117431640625, 1.619873046875, 1.8280029296875, 2.0361328125, 2.2442626953125, 2.452392578125, 2.6605224609375, 2.86865234375, 3.0767822265625, 3.284912109375, 3.4930419921875, 3.701171875, 3.9093017578125, 4.117431640625, 4.3255615234375, 4.53369140625, 4.7418212890625, 4.949951171875, 5.1580810546875, 5.3662109375, 5.5743408203125, 5.782470703125, 5.9906005859375, 6.19873046875, 6.4068603515625, 6.614990234375, 6.8231201171875, 7.03125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 13.0, 7.0, 8.0, 17.0, 28.0, 27.0, 28.0, 29.0, 34.0, 38.0, 49.0, 62.0, 99.0, 150.0, 397.0, 1425.0, 164.0, 92.0, 57.0, 59.0, 31.0, 34.0, 36.0, 23.0, 34.0, 21.0, 14.0, 9.0, 11.0, 11.0, 2.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.609375, -27.7919921875, -26.974609375, -26.1572265625, -25.33984375, -24.5224609375, -23.705078125, -22.8876953125, -22.0703125, -21.2529296875, -20.435546875, -19.6181640625, -18.80078125, -17.9833984375, -17.166015625, -16.3486328125, -15.53125, -14.7138671875, -13.896484375, -13.0791015625, -12.26171875, -11.4443359375, -10.626953125, -9.8095703125, -8.9921875, -8.1748046875, -7.357421875, -6.5400390625, -5.72265625, -4.9052734375, -4.087890625, -3.2705078125, -2.453125, -1.6357421875, -0.818359375, -0.0009765625, 0.81640625, 1.6337890625, 2.451171875, 3.2685546875, 4.0859375, 4.9033203125, 5.720703125, 6.5380859375, 7.35546875, 8.1728515625, 8.990234375, 9.8076171875, 10.625, 11.4423828125, 12.259765625, 13.0771484375, 13.89453125, 14.7119140625, 15.529296875, 16.3466796875, 17.1640625, 17.9814453125, 18.798828125, 19.6162109375, 20.43359375, 21.2509765625, 22.068359375, 22.8857421875, 23.703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 12.0, 11.0, 17.0, 20.0, 32.0, 38.0, 66.0, 84.0, 154.0, 215.0, 375.0, 890.0, 38517.0, 3099070.0, 4633.0, 645.0, 325.0, 174.0, 130.0, 78.0, 56.0, 45.0, 36.0, 20.0, 12.0, 14.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.4375, -82.7099609375, -79.982421875, -77.2548828125, -74.52734375, -71.7998046875, -69.072265625, -66.3447265625, -63.6171875, -60.8896484375, -58.162109375, -55.4345703125, -52.70703125, -49.9794921875, -47.251953125, -44.5244140625, -41.796875, -39.0693359375, -36.341796875, -33.6142578125, -30.88671875, -28.1591796875, -25.431640625, -22.7041015625, -19.9765625, -17.2490234375, -14.521484375, -11.7939453125, -9.06640625, -6.3388671875, -3.611328125, -0.8837890625, 1.84375, 4.5712890625, 7.298828125, 10.0263671875, 12.75390625, 15.4814453125, 18.208984375, 20.9365234375, 23.6640625, 26.3916015625, 29.119140625, 31.8466796875, 34.57421875, 37.3017578125, 40.029296875, 42.7568359375, 45.484375, 48.2119140625, 50.939453125, 53.6669921875, 56.39453125, 59.1220703125, 61.849609375, 64.5771484375, 67.3046875, 70.0322265625, 72.759765625, 75.4873046875, 78.21484375, 80.9423828125, 83.669921875, 86.3974609375, 89.125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [101.0, 853.0, 61.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.375727653503418, -4.142389297485352, 4.090949058532715, 12.324288368225098, 20.55762481689453, 28.79096221923828, 37.0243034362793, 45.25764083862305, 53.4909782409668, 61.72431564331055, 69.95765686035156, 78.19099426269531, 86.42433166503906, 94.65766906738281, 102.89100646972656, 111.12434387207031, 119.3576889038086, 127.59102630615234, 135.82437133789062, 144.05770874023438, 152.29104614257812, 160.52438354492188, 168.75772094726562, 176.99105834960938, 185.22439575195312, 193.45773315429688, 201.69107055664062, 209.92440795898438, 218.15774536132812, 226.39108276367188, 234.62442016601562, 242.85775756835938, 251.09109497070312, 259.3244323730469, 267.5577697753906, 275.7911071777344, 284.0244445800781, 292.2577819824219, 300.4911193847656, 308.7244567871094, 316.9577941894531, 325.1911315917969, 333.4244689941406, 341.6578063964844, 349.8911437988281, 358.1244812011719, 366.3578186035156, 374.5911560058594, 382.82452392578125, 391.057861328125, 399.29119873046875, 407.5245361328125, 415.75787353515625, 423.9912109375, 432.22454833984375, 440.4578857421875, 448.69122314453125, 456.924560546875, 465.15789794921875, 473.3912353515625, 481.62457275390625, 489.85791015625, 498.09124755859375, 506.3245849609375, 514.5579223632812]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 10.0, 9.0, 8.0, 15.0, 18.0, 14.0, 22.0, 12.0, 18.0, 12.0, 25.0, 26.0, 29.0, 28.0, 37.0, 38.0, 39.0, 45.0, 38.0, 26.0, 46.0, 35.0, 28.0, 40.0, 34.0, 31.0, 26.0, 38.0, 31.0, 30.0, 35.0, 14.0, 29.0, 20.0, 15.0, 14.0, 9.0, 13.0, 4.0, 6.0, 6.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.27090835571289, -46.7557487487793, -45.2405891418457, -43.72542953491211, -42.21026611328125, -40.695106506347656, -39.17994689941406, -37.66478729248047, -36.149627685546875, -34.63446807861328, -33.11930847167969, -31.60414695739746, -30.088987350463867, -28.573827743530273, -27.058666229248047, -25.543506622314453, -24.02834701538086, -22.513187408447266, -20.998027801513672, -19.482866287231445, -17.96770668029785, -16.452547073364258, -14.937386512756348, -13.422225952148438, -11.907066345214844, -10.39190673828125, -8.87674617767334, -7.361586093902588, -5.846426010131836, -4.331265926361084, -2.816105842590332, -1.3009452819824219, 0.21421432495117188, 1.7293744087219238, 3.244534492492676, 4.759694576263428, 6.27485466003418, 7.790014743804932, 9.305174827575684, 10.820335388183594, 12.335494995117188, 13.850654602050781, 15.365815162658691, 16.8809757232666, 18.396135330200195, 19.91129493713379, 21.426456451416016, 22.94161605834961, 24.456775665283203, 25.971935272216797, 27.48709487915039, 29.002256393432617, 30.51741600036621, 32.03257751464844, 33.54773712158203, 35.062896728515625, 36.57805633544922, 38.09321594238281, 39.608375549316406, 41.12353515625, 42.638694763183594, 44.15385818481445, 45.66901779174805, 47.18417739868164, 48.699337005615234]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 6.0, 7.0, 10.0, 10.0, 9.0, 14.0, 10.0, 19.0, 25.0, 21.0, 30.0, 33.0, 51.0, 38.0, 36.0, 24.0, 51.0, 42.0, 59.0, 38.0, 46.0, 38.0, 41.0, 39.0, 31.0, 44.0, 23.0, 29.0, 28.0, 26.0, 19.0, 15.0, 14.0, 17.0, 17.0, 7.0, 6.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.2113037109375, -5.985107421875, -5.7589111328125, -5.53271484375, -5.3065185546875, -5.080322265625, -4.8541259765625, -4.6279296875, -4.4017333984375, -4.175537109375, -3.9493408203125, -3.72314453125, -3.4969482421875, -3.270751953125, -3.0445556640625, -2.818359375, -2.5921630859375, -2.365966796875, -2.1397705078125, -1.91357421875, -1.6873779296875, -1.461181640625, -1.2349853515625, -1.0087890625, -0.7825927734375, -0.556396484375, -0.3302001953125, -0.10400390625, 0.1221923828125, 0.348388671875, 0.5745849609375, 0.80078125, 1.0269775390625, 1.253173828125, 1.4793701171875, 1.70556640625, 1.9317626953125, 2.157958984375, 2.3841552734375, 2.6103515625, 2.8365478515625, 3.062744140625, 3.2889404296875, 3.51513671875, 3.7413330078125, 3.967529296875, 4.1937255859375, 4.419921875, 4.6461181640625, 4.872314453125, 5.0985107421875, 5.32470703125, 5.5509033203125, 5.777099609375, 6.0032958984375, 6.2294921875, 6.4556884765625, 6.681884765625, 6.9080810546875, 7.13427734375, 7.3604736328125, 7.586669921875, 7.8128662109375, 8.0390625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 15.0, 16.0, 13.0, 17.0, 34.0, 19.0, 36.0, 62.0, 69.0, 91.0, 126.0, 210.0, 342.0, 815.0, 3590.0, 49210.0, 1095016.0, 2735125.0, 293462.0, 13136.0, 1527.0, 483.0, 252.0, 161.0, 96.0, 73.0, 62.0, 44.0, 39.0, 26.0, 20.0, 22.0, 11.0, 7.0, 17.0, 9.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.49609375, -16.8984375, -16.30078125, -15.703125, -15.10546875, -14.5078125, -13.91015625, -13.3125, -12.71484375, -12.1171875, -11.51953125, -10.921875, -10.32421875, -9.7265625, -9.12890625, -8.53125, -7.93359375, -7.3359375, -6.73828125, -6.140625, -5.54296875, -4.9453125, -4.34765625, -3.75, -3.15234375, -2.5546875, -1.95703125, -1.359375, -0.76171875, -0.1640625, 0.43359375, 1.03125, 1.62890625, 2.2265625, 2.82421875, 3.421875, 4.01953125, 4.6171875, 5.21484375, 5.8125, 6.41015625, 7.0078125, 7.60546875, 8.203125, 8.80078125, 9.3984375, 9.99609375, 10.59375, 11.19140625, 11.7890625, 12.38671875, 12.984375, 13.58203125, 14.1796875, 14.77734375, 15.375, 15.97265625, 16.5703125, 17.16796875, 17.765625, 18.36328125, 18.9609375, 19.55859375, 20.15625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 7.0, 13.0, 11.0, 14.0, 26.0, 43.0, 54.0, 66.0, 87.0, 138.0, 222.0, 287.0, 406.0, 466.0, 518.0, 415.0, 357.0, 262.0, 195.0, 132.0, 89.0, 79.0, 56.0, 33.0, 29.0, 20.0, 14.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0859375, -13.6221923828125, -13.158447265625, -12.6947021484375, -12.23095703125, -11.7672119140625, -11.303466796875, -10.8397216796875, -10.3759765625, -9.9122314453125, -9.448486328125, -8.9847412109375, -8.52099609375, -8.0572509765625, -7.593505859375, -7.1297607421875, -6.666015625, -6.2022705078125, -5.738525390625, -5.2747802734375, -4.81103515625, -4.3472900390625, -3.883544921875, -3.4197998046875, -2.9560546875, -2.4923095703125, -2.028564453125, -1.5648193359375, -1.10107421875, -0.6373291015625, -0.173583984375, 0.2901611328125, 0.75390625, 1.2176513671875, 1.681396484375, 2.1451416015625, 2.60888671875, 3.0726318359375, 3.536376953125, 4.0001220703125, 4.4638671875, 4.9276123046875, 5.391357421875, 5.8551025390625, 6.31884765625, 6.7825927734375, 7.246337890625, 7.7100830078125, 8.173828125, 8.6375732421875, 9.101318359375, 9.5650634765625, 10.02880859375, 10.4925537109375, 10.956298828125, 11.4200439453125, 11.8837890625, 12.3475341796875, 12.811279296875, 13.2750244140625, 13.73876953125, 14.2025146484375, 14.666259765625, 15.1300048828125, 15.59375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 8.0, 3.0, 5.0, 6.0, 18.0, 14.0, 29.0, 39.0, 56.0, 71.0, 99.0, 152.0, 210.0, 355.0, 624.0, 6151.0, 3625400.0, 557827.0, 1781.0, 541.0, 289.0, 212.0, 111.0, 76.0, 64.0, 43.0, 32.0, 19.0, 11.0, 12.0, 12.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.9375, -67.8701171875, -65.802734375, -63.7353515625, -61.66796875, -59.6005859375, -57.533203125, -55.4658203125, -53.3984375, -51.3310546875, -49.263671875, -47.1962890625, -45.12890625, -43.0615234375, -40.994140625, -38.9267578125, -36.859375, -34.7919921875, -32.724609375, -30.6572265625, -28.58984375, -26.5224609375, -24.455078125, -22.3876953125, -20.3203125, -18.2529296875, -16.185546875, -14.1181640625, -12.05078125, -9.9833984375, -7.916015625, -5.8486328125, -3.78125, -1.7138671875, 0.353515625, 2.4208984375, 4.48828125, 6.5556640625, 8.623046875, 10.6904296875, 12.7578125, 14.8251953125, 16.892578125, 18.9599609375, 21.02734375, 23.0947265625, 25.162109375, 27.2294921875, 29.296875, 31.3642578125, 33.431640625, 35.4990234375, 37.56640625, 39.6337890625, 41.701171875, 43.7685546875, 45.8359375, 47.9033203125, 49.970703125, 52.0380859375, 54.10546875, 56.1728515625, 58.240234375, 60.3076171875, 62.375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 62.0, 367.0, 467.0, 106.0, 12.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.62886047363281, -69.0408706665039, -61.452880859375, -53.86488723754883, -46.27689743041992, -38.688907623291016, -31.100914001464844, -23.512924194335938, -15.924934387207031, -8.336943626403809, -0.7489528656005859, 6.839038848876953, 14.42702865600586, 22.015018463134766, 29.603012084960938, 37.191001892089844, 44.77899169921875, 52.366981506347656, 59.95497131347656, 67.54296875, 75.13095092773438, 82.71894836425781, 90.30693817138672, 97.89492797851562, 105.48291778564453, 113.07090759277344, 120.65889739990234, 128.24688720703125, 135.8348846435547, 143.42286682128906, 151.0108642578125, 158.59884643554688, 166.18682861328125, 173.7748260498047, 181.36280822753906, 188.9508056640625, 196.53878784179688, 204.1267852783203, 211.71478271484375, 219.30276489257812, 226.8907470703125, 234.47874450683594, 242.0667266845703, 249.65472412109375, 257.2427062988281, 264.8306884765625, 272.418701171875, 280.0066833496094, 287.59466552734375, 295.1826477050781, 302.7706604003906, 310.358642578125, 317.9466247558594, 325.53460693359375, 333.12261962890625, 340.7106018066406, 348.2986145019531, 355.8865966796875, 363.474609375, 371.0625915527344, 378.65057373046875, 386.2385559082031, 393.8265686035156, 401.41455078125, 409.0025329589844]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 7.0, 6.0, 8.0, 11.0, 8.0, 14.0, 18.0, 18.0, 23.0, 18.0, 33.0, 27.0, 38.0, 29.0, 39.0, 40.0, 39.0, 35.0, 32.0, 39.0, 55.0, 44.0, 33.0, 42.0, 37.0, 40.0, 32.0, 31.0, 26.0, 22.0, 23.0, 18.0, 19.0, 16.0, 13.0, 8.0, 7.0, 7.0, 10.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.74001693725586, -43.415733337402344, -42.09144592285156, -40.76716232299805, -39.44287872314453, -38.11859130859375, -36.794307708740234, -35.47002410888672, -34.14573669433594, -32.82145309448242, -31.497167587280273, -30.172882080078125, -28.84859848022461, -27.52431297302246, -26.200027465820312, -24.875743865966797, -23.55146026611328, -22.227174758911133, -20.902891159057617, -19.57860565185547, -18.254322052001953, -16.930036544799805, -15.605751037597656, -14.281466484069824, -12.957181930541992, -11.63289737701416, -10.308612823486328, -8.98432731628418, -7.660042762756348, -6.335758209228516, -5.011473178863525, -3.687188148498535, -2.3628997802734375, -1.0386149883270264, 0.28566980361938477, 1.609954595565796, 2.934239387512207, 4.258523941040039, 5.582808971405029, 6.9070940017700195, 8.231378555297852, 9.555663108825684, 10.879947662353516, 12.204233169555664, 13.528517723083496, 14.852802276611328, 16.177087783813477, 17.501373291015625, 18.82565689086914, 20.14994239807129, 21.474225997924805, 22.798511505126953, 24.12279510498047, 25.447080612182617, 26.771366119384766, 28.09564971923828, 29.41993522644043, 30.744220733642578, 32.068504333496094, 33.39278793334961, 34.71707534790039, 36.041358947753906, 37.36564254760742, 38.6899299621582, 40.01421356201172]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 11.0, 12.0, 16.0, 13.0, 12.0, 21.0, 29.0, 26.0, 32.0, 38.0, 33.0, 34.0, 42.0, 44.0, 48.0, 37.0, 47.0, 58.0, 49.0, 42.0, 43.0, 44.0, 37.0, 21.0, 26.0, 24.0, 24.0, 13.0, 22.0, 17.0, 17.0, 12.0, 7.0, 17.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.45703125, -7.24188232421875, -7.0267333984375, -6.81158447265625, -6.596435546875, -6.38128662109375, -6.1661376953125, -5.95098876953125, -5.73583984375, -5.52069091796875, -5.3055419921875, -5.09039306640625, -4.875244140625, -4.66009521484375, -4.4449462890625, -4.22979736328125, -4.0146484375, -3.79949951171875, -3.5843505859375, -3.36920166015625, -3.154052734375, -2.93890380859375, -2.7237548828125, -2.50860595703125, -2.29345703125, -2.07830810546875, -1.8631591796875, -1.64801025390625, -1.432861328125, -1.21771240234375, -1.0025634765625, -0.78741455078125, -0.572265625, -0.35711669921875, -0.1419677734375, 0.07318115234375, 0.288330078125, 0.50347900390625, 0.7186279296875, 0.93377685546875, 1.14892578125, 1.36407470703125, 1.5792236328125, 1.79437255859375, 2.009521484375, 2.22467041015625, 2.4398193359375, 2.65496826171875, 2.8701171875, 3.08526611328125, 3.3004150390625, 3.51556396484375, 3.730712890625, 3.94586181640625, 4.1610107421875, 4.37615966796875, 4.59130859375, 4.80645751953125, 5.0216064453125, 5.23675537109375, 5.451904296875, 5.66705322265625, 5.8822021484375, 6.09735107421875, 6.3125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 14.0, 11.0, 26.0, 38.0, 49.0, 74.0, 100.0, 149.0, 237.0, 325.0, 490.0, 711.0, 1076.0, 1552.0, 2193.0, 3509.0, 5023.0, 7573.0, 11442.0, 17476.0, 26631.0, 40192.0, 60999.0, 92166.0, 138853.0, 178494.0, 153339.0, 104069.0, 68644.0, 45024.0, 29419.0, 19762.0, 12790.0, 8563.0, 5677.0, 3885.0, 2552.0, 1731.0, 1188.0, 819.0, 530.0, 361.0, 241.0, 164.0, 128.0, 94.0, 54.0, 37.0, 21.0, 15.0, 11.0, 8.0, 7.0, 5.0, 4.0, 0.0, 2.0], "bins": [-0.4296875, -0.4165229797363281, -0.40335845947265625, -0.3901939392089844, -0.3770294189453125, -0.3638648986816406, -0.35070037841796875, -0.3375358581542969, -0.324371337890625, -0.3112068176269531, -0.29804229736328125, -0.2848777770996094, -0.2717132568359375, -0.2585487365722656, -0.24538421630859375, -0.23221969604492188, -0.21905517578125, -0.20589065551757812, -0.19272613525390625, -0.17956161499023438, -0.1663970947265625, -0.15323257446289062, -0.14006805419921875, -0.12690353393554688, -0.113739013671875, -0.10057449340820312, -0.08740997314453125, -0.07424545288085938, -0.0610809326171875, -0.047916412353515625, -0.03475189208984375, -0.021587371826171875, -0.0084228515625, 0.004741668701171875, 0.01790618896484375, 0.031070709228515625, 0.0442352294921875, 0.057399749755859375, 0.07056427001953125, 0.08372879028320312, 0.096893310546875, 0.11005783081054688, 0.12322235107421875, 0.13638687133789062, 0.1495513916015625, 0.16271591186523438, 0.17588043212890625, 0.18904495239257812, 0.20220947265625, 0.21537399291992188, 0.22853851318359375, 0.24170303344726562, 0.2548675537109375, 0.2680320739746094, 0.28119659423828125, 0.2943611145019531, 0.307525634765625, 0.3206901550292969, 0.33385467529296875, 0.3470191955566406, 0.3601837158203125, 0.3733482360839844, 0.38651275634765625, 0.3996772766113281, 0.412841796875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 7.0, 11.0, 14.0, 18.0, 20.0, 25.0, 30.0, 17.0, 33.0, 34.0, 34.0, 37.0, 39.0, 42.0, 35.0, 38.0, 1062.0, 58.0, 40.0, 36.0, 29.0, 37.0, 33.0, 33.0, 30.0, 24.0, 23.0, 12.0, 24.0, 25.0, 22.0, 20.0, 10.0, 7.0, 9.0, 5.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.296875, -4.171051025390625, -4.04522705078125, -3.919403076171875, -3.7935791015625, -3.667755126953125, -3.54193115234375, -3.416107177734375, -3.290283203125, -3.164459228515625, -3.03863525390625, -2.912811279296875, -2.7869873046875, -2.661163330078125, -2.53533935546875, -2.409515380859375, -2.28369140625, -2.157867431640625, -2.03204345703125, -1.906219482421875, -1.7803955078125, -1.654571533203125, -1.52874755859375, -1.402923583984375, -1.277099609375, -1.151275634765625, -1.02545166015625, -0.899627685546875, -0.7738037109375, -0.647979736328125, -0.52215576171875, -0.396331787109375, -0.2705078125, -0.144683837890625, -0.01885986328125, 0.106964111328125, 0.2327880859375, 0.358612060546875, 0.48443603515625, 0.610260009765625, 0.736083984375, 0.861907958984375, 0.98773193359375, 1.113555908203125, 1.2393798828125, 1.365203857421875, 1.49102783203125, 1.616851806640625, 1.74267578125, 1.868499755859375, 1.99432373046875, 2.120147705078125, 2.2459716796875, 2.371795654296875, 2.49761962890625, 2.623443603515625, 2.749267578125, 2.875091552734375, 3.00091552734375, 3.126739501953125, 3.2525634765625, 3.378387451171875, 3.50421142578125, 3.630035400390625, 3.755859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 8.0, 13.0, 10.0, 14.0, 31.0, 30.0, 78.0, 96.0, 155.0, 198.0, 325.0, 504.0, 780.0, 1162.0, 1758.0, 2755.0, 4077.0, 6434.0, 10012.0, 15522.0, 24295.0, 37477.0, 58132.0, 90626.0, 137352.0, 1224580.0, 160375.0, 113310.0, 74219.0, 47532.0, 30391.0, 19555.0, 12564.0, 7990.0, 5104.0, 3338.0, 2193.0, 1453.0, 931.0, 614.0, 380.0, 261.0, 169.0, 111.0, 79.0, 50.0, 32.0, 25.0, 11.0, 12.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.421630859375, -0.40914154052734375, -0.3966522216796875, -0.38416290283203125, -0.371673583984375, -0.35918426513671875, -0.3466949462890625, -0.33420562744140625, -0.32171630859375, -0.30922698974609375, -0.2967376708984375, -0.28424835205078125, -0.271759033203125, -0.25926971435546875, -0.2467803955078125, -0.23429107666015625, -0.2218017578125, -0.20931243896484375, -0.1968231201171875, -0.18433380126953125, -0.171844482421875, -0.15935516357421875, -0.1468658447265625, -0.13437652587890625, -0.12188720703125, -0.10939788818359375, -0.0969085693359375, -0.08441925048828125, -0.071929931640625, -0.05944061279296875, -0.0469512939453125, -0.03446197509765625, -0.02197265625, -0.00948333740234375, 0.0030059814453125, 0.01549530029296875, 0.027984619140625, 0.04047393798828125, 0.0529632568359375, 0.06545257568359375, 0.07794189453125, 0.09043121337890625, 0.1029205322265625, 0.11540985107421875, 0.127899169921875, 0.14038848876953125, 0.1528778076171875, 0.16536712646484375, 0.1778564453125, 0.19034576416015625, 0.2028350830078125, 0.21532440185546875, 0.227813720703125, 0.24030303955078125, 0.2527923583984375, 0.26528167724609375, 0.27777099609375, 0.29026031494140625, 0.3027496337890625, 0.31523895263671875, 0.327728271484375, 0.34021759033203125, 0.3527069091796875, 0.36519622802734375, 0.377685546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 7.0, 10.0, 14.0, 34.0, 37.0, 34.0, 35.0, 62.0, 85.0, 91.0, 105.0, 107.0, 99.0, 58.0, 65.0, 45.0, 35.0, 20.0, 16.0, 7.0, 3.0, 9.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00237274169921875, -0.002306237816810608, -0.002239733934402466, -0.0021732300519943237, -0.0021067261695861816, -0.0020402222871780396, -0.0019737184047698975, -0.0019072145223617554, -0.0018407106399536133, -0.0017742067575454712, -0.001707702875137329, -0.001641198992729187, -0.001574695110321045, -0.0015081912279129028, -0.0014416873455047607, -0.0013751834630966187, -0.0013086795806884766, -0.0012421756982803345, -0.0011756718158721924, -0.0011091679334640503, -0.0010426640510559082, -0.0009761601686477661, -0.000909656286239624, -0.0008431524038314819, -0.0007766485214233398, -0.0007101446390151978, -0.0006436407566070557, -0.0005771368741989136, -0.0005106329917907715, -0.0004441291093826294, -0.0003776252269744873, -0.0003111213445663452, -0.0002446174621582031, -0.00017811357975006104, -0.00011160969734191895, -4.5105814933776855e-05, 2.1398067474365234e-05, 8.790194988250732e-05, 0.00015440583229064941, 0.0002209097146987915, 0.0002874135971069336, 0.0003539174795150757, 0.0004204213619232178, 0.00048692524433135986, 0.000553429126739502, 0.000619933009147644, 0.0006864368915557861, 0.0007529407739639282, 0.0008194446563720703, 0.0008859485387802124, 0.0009524524211883545, 0.0010189563035964966, 0.0010854601860046387, 0.0011519640684127808, 0.0012184679508209229, 0.001284971833229065, 0.001351475715637207, 0.0014179795980453491, 0.0014844834804534912, 0.0015509873628616333, 0.0016174912452697754, 0.0016839951276779175, 0.0017504990100860596, 0.0018170028924942017, 0.0018835067749023438]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 8.0, 11.0, 8.0, 20.0, 29.0, 41.0, 57.0, 84.0, 120.0, 270.0, 514.0, 13049.0, 1031862.0, 1562.0, 354.0, 164.0, 114.0, 88.0, 61.0, 35.0, 29.0, 13.0, 13.0, 4.0, 9.0, 3.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03778076171875, -0.036446571350097656, -0.03511238098144531, -0.03377819061279297, -0.032444000244140625, -0.03110980987548828, -0.029775619506835938, -0.028441429138183594, -0.02710723876953125, -0.025773048400878906, -0.024438858032226562, -0.02310466766357422, -0.021770477294921875, -0.02043628692626953, -0.019102096557617188, -0.017767906188964844, -0.0164337158203125, -0.015099525451660156, -0.013765335083007812, -0.012431144714355469, -0.011096954345703125, -0.009762763977050781, -0.008428573608398438, -0.007094383239746094, -0.00576019287109375, -0.004426002502441406, -0.0030918121337890625, -0.0017576217651367188, -0.000423431396484375, 0.0009107589721679688, 0.0022449493408203125, 0.0035791397094726562, 0.004913330078125, 0.006247520446777344, 0.0075817108154296875, 0.008915901184082031, 0.010250091552734375, 0.011584281921386719, 0.012918472290039062, 0.014252662658691406, 0.01558685302734375, 0.016921043395996094, 0.018255233764648438, 0.01958942413330078, 0.020923614501953125, 0.02225780487060547, 0.023591995239257812, 0.024926185607910156, 0.0262603759765625, 0.027594566345214844, 0.028928756713867188, 0.03026294708251953, 0.031597137451171875, 0.03293132781982422, 0.03426551818847656, 0.035599708557128906, 0.03693389892578125, 0.038268089294433594, 0.03960227966308594, 0.04093647003173828, 0.042270660400390625, 0.04360485076904297, 0.04493904113769531, 0.046273231506347656, 0.047607421875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 14.0, 61.0, 180.0, 303.0, 253.0, 130.0, 45.0, 18.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0028207041323184967, -0.0027498146519064903, -0.0026789249386638403, -0.002608035458251834, -0.002537145745009184, -0.0024662562645971775, -0.002395366784185171, -0.0023244773037731647, -0.0022535875905305147, -0.0021826981101185083, -0.0021118083968758583, -0.002040918916463852, -0.0019700294360518456, -0.0018991397228091955, -0.0018282502423971891, -0.001757360645569861, -0.0016864710487425327, -0.0016155814519152045, -0.0015446918550878763, -0.00147380237467587, -0.0014029127778485417, -0.0013320231810212135, -0.0012611337006092072, -0.001190244103781879, -0.0011193545069545507, -0.0010484649101272225, -0.0009775753132998943, -0.000906685832887888, -0.0008357962360605597, -0.0007649066392332315, -0.0006940171006135643, -0.000623127561993897, -0.0005522381979972124, -0.00048134863027371466, -0.0004104590625502169, -0.00033956949482671916, -0.0002686799271032214, -0.00019779035937972367, -0.00012690079165622592, -5.601125303655863e-05, 1.4878343790769577e-05, 8.576791151426733e-05, 0.00015665747923776507, 0.00022754704696126282, 0.00029843661468476057, 0.0003693261824082583, 0.00044021575013175607, 0.0005111052887514234, 0.0005819948855787516, 0.0006528844824060798, 0.0007237740210257471, 0.0007946635596454144, 0.0008655531564727426, 0.0009364427533000708, 0.0010073322337120771, 0.0010782218305394053, 0.0011491114273667336, 0.0012200010241940618, 0.00129089062102139, 0.0013617801014333963, 0.0014326696982607245, 0.0015035592950880527, 0.0015744487755000591, 0.0016453383723273873, 0.0017162279691547155]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 3.0, 6.0, 11.0, 19.0, 13.0, 12.0, 19.0, 23.0, 17.0, 17.0, 21.0, 35.0, 29.0, 34.0, 45.0, 43.0, 43.0, 46.0, 47.0, 35.0, 38.0, 49.0, 43.0, 38.0, 34.0, 28.0, 31.0, 30.0, 26.0, 27.0, 15.0, 16.0, 15.0, 18.0, 14.0, 9.0, 8.0, 8.0, 6.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006355047225952148, -0.0006129816174507141, -0.0005904585123062134, -0.0005679354071617126, -0.0005454123020172119, -0.0005228891968727112, -0.0005003660917282104, -0.0004778429865837097, -0.000455319881439209, -0.00043279677629470825, -0.0004102736711502075, -0.0003877505660057068, -0.00036522746086120605, -0.0003427043557167053, -0.0003201812505722046, -0.00029765814542770386, -0.0002751350402832031, -0.0002526119351387024, -0.00023008882999420166, -0.00020756572484970093, -0.0001850426197052002, -0.00016251951456069946, -0.00013999640941619873, -0.000117473304271698, -9.495019912719727e-05, -7.242709398269653e-05, -4.99039888381958e-05, -2.738088369369507e-05, -4.857778549194336e-06, 1.7665326595306396e-05, 4.018843173980713e-05, 6.271153688430786e-05, 8.52346420288086e-05, 0.00010775774717330933, 0.00013028085231781006, 0.0001528039574623108, 0.00017532706260681152, 0.00019785016775131226, 0.000220373272895813, 0.00024289637804031372, 0.00026541948318481445, 0.0002879425883293152, 0.0003104656934738159, 0.00033298879861831665, 0.0003555119037628174, 0.0003780350089073181, 0.00040055811405181885, 0.0004230812191963196, 0.0004456043243408203, 0.00046812742948532104, 0.0004906505346298218, 0.0005131736397743225, 0.0005356967449188232, 0.000558219850063324, 0.0005807429552078247, 0.0006032660603523254, 0.0006257891654968262, 0.0006483122706413269, 0.0006708353757858276, 0.0006933584809303284, 0.0007158815860748291, 0.0007384046912193298, 0.0007609277963638306, 0.0007834509015083313, 0.000805974006652832]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 11.0, 12.0, 16.0, 13.0, 12.0, 21.0, 29.0, 26.0, 32.0, 38.0, 33.0, 33.0, 43.0, 44.0, 48.0, 37.0, 47.0, 58.0, 49.0, 42.0, 43.0, 44.0, 37.0, 21.0, 26.0, 24.0, 24.0, 13.0, 22.0, 17.0, 17.0, 12.0, 7.0, 17.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.45703125, -7.24188232421875, -7.0267333984375, -6.81158447265625, -6.596435546875, -6.38128662109375, -6.1661376953125, -5.95098876953125, -5.73583984375, -5.52069091796875, -5.3055419921875, -5.09039306640625, -4.875244140625, -4.66009521484375, -4.4449462890625, -4.22979736328125, -4.0146484375, -3.79949951171875, -3.5843505859375, -3.36920166015625, -3.154052734375, -2.93890380859375, -2.7237548828125, -2.50860595703125, -2.29345703125, -2.07830810546875, -1.8631591796875, -1.64801025390625, -1.432861328125, -1.21771240234375, -1.0025634765625, -0.78741455078125, -0.572265625, -0.35711669921875, -0.1419677734375, 0.07318115234375, 0.288330078125, 0.50347900390625, 0.7186279296875, 0.93377685546875, 1.14892578125, 1.36407470703125, 1.5792236328125, 1.79437255859375, 2.009521484375, 2.22467041015625, 2.4398193359375, 2.65496826171875, 2.8701171875, 3.08526611328125, 3.3004150390625, 3.51556396484375, 3.730712890625, 3.94586181640625, 4.1610107421875, 4.37615966796875, 4.59130859375, 4.80645751953125, 5.0216064453125, 5.23675537109375, 5.451904296875, 5.66705322265625, 5.8822021484375, 6.09735107421875, 6.3125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 4.0, 5.0, 17.0, 14.0, 27.0, 26.0, 35.0, 65.0, 68.0, 75.0, 129.0, 229.0, 399.0, 760.0, 1716.0, 4287.0, 10444.0, 26957.0, 67759.0, 166872.0, 358929.0, 239890.0, 101983.0, 40402.0, 16079.0, 6467.0, 2503.0, 1058.0, 506.0, 258.0, 121.0, 115.0, 73.0, 64.0, 59.0, 32.0, 30.0, 21.0, 29.0, 6.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.65234375, -7.43194580078125, -7.2115478515625, -6.99114990234375, -6.770751953125, -6.55035400390625, -6.3299560546875, -6.10955810546875, -5.88916015625, -5.66876220703125, -5.4483642578125, -5.22796630859375, -5.007568359375, -4.78717041015625, -4.5667724609375, -4.34637451171875, -4.1259765625, -3.90557861328125, -3.6851806640625, -3.46478271484375, -3.244384765625, -3.02398681640625, -2.8035888671875, -2.58319091796875, -2.36279296875, -2.14239501953125, -1.9219970703125, -1.70159912109375, -1.481201171875, -1.26080322265625, -1.0404052734375, -0.82000732421875, -0.599609375, -0.37921142578125, -0.1588134765625, 0.06158447265625, 0.281982421875, 0.50238037109375, 0.7227783203125, 0.94317626953125, 1.16357421875, 1.38397216796875, 1.6043701171875, 1.82476806640625, 2.045166015625, 2.26556396484375, 2.4859619140625, 2.70635986328125, 2.9267578125, 3.14715576171875, 3.3675537109375, 3.58795166015625, 3.808349609375, 4.02874755859375, 4.2491455078125, 4.46954345703125, 4.68994140625, 4.91033935546875, 5.1307373046875, 5.35113525390625, 5.571533203125, 5.79193115234375, 6.0123291015625, 6.23272705078125, 6.453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 7.0, 5.0, 7.0, 5.0, 13.0, 6.0, 10.0, 10.0, 24.0, 22.0, 20.0, 22.0, 30.0, 39.0, 35.0, 35.0, 32.0, 57.0, 63.0, 142.0, 350.0, 1453.0, 174.0, 84.0, 57.0, 46.0, 42.0, 35.0, 37.0, 24.0, 15.0, 25.0, 13.0, 21.0, 14.0, 18.0, 8.0, 17.0, 2.0, 10.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -22.0224609375, -21.357421875, -20.6923828125, -20.02734375, -19.3623046875, -18.697265625, -18.0322265625, -17.3671875, -16.7021484375, -16.037109375, -15.3720703125, -14.70703125, -14.0419921875, -13.376953125, -12.7119140625, -12.046875, -11.3818359375, -10.716796875, -10.0517578125, -9.38671875, -8.7216796875, -8.056640625, -7.3916015625, -6.7265625, -6.0615234375, -5.396484375, -4.7314453125, -4.06640625, -3.4013671875, -2.736328125, -2.0712890625, -1.40625, -0.7412109375, -0.076171875, 0.5888671875, 1.25390625, 1.9189453125, 2.583984375, 3.2490234375, 3.9140625, 4.5791015625, 5.244140625, 5.9091796875, 6.57421875, 7.2392578125, 7.904296875, 8.5693359375, 9.234375, 9.8994140625, 10.564453125, 11.2294921875, 11.89453125, 12.5595703125, 13.224609375, 13.8896484375, 14.5546875, 15.2197265625, 15.884765625, 16.5498046875, 17.21484375, 17.8798828125, 18.544921875, 19.2099609375, 19.875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 9.0, 12.0, 12.0, 28.0, 33.0, 31.0, 70.0, 77.0, 111.0, 190.0, 400.0, 1078.0, 7822.0, 3123815.0, 9844.0, 1067.0, 434.0, 206.0, 152.0, 76.0, 43.0, 35.0, 32.0, 32.0, 19.0, 17.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.5625, -101.443359375, -98.32421875, -95.205078125, -92.0859375, -88.966796875, -85.84765625, -82.728515625, -79.609375, -76.490234375, -73.37109375, -70.251953125, -67.1328125, -64.013671875, -60.89453125, -57.775390625, -54.65625, -51.537109375, -48.41796875, -45.298828125, -42.1796875, -39.060546875, -35.94140625, -32.822265625, -29.703125, -26.583984375, -23.46484375, -20.345703125, -17.2265625, -14.107421875, -10.98828125, -7.869140625, -4.75, -1.630859375, 1.48828125, 4.607421875, 7.7265625, 10.845703125, 13.96484375, 17.083984375, 20.203125, 23.322265625, 26.44140625, 29.560546875, 32.6796875, 35.798828125, 38.91796875, 42.037109375, 45.15625, 48.275390625, 51.39453125, 54.513671875, 57.6328125, 60.751953125, 63.87109375, 66.990234375, 70.109375, 73.228515625, 76.34765625, 79.466796875, 82.5859375, 85.705078125, 88.82421875, 91.943359375, 95.0625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 19.0, 165.0, 449.0, 316.0, 62.0, 4.0, 1.0, 0.0, 1.0], "bins": [-207.00746154785156, -203.4169464111328, -199.82643127441406, -196.2359161376953, -192.64540100097656, -189.0548858642578, -185.46437072753906, -181.8738555908203, -178.28334045410156, -174.6928253173828, -171.10231018066406, -167.5117950439453, -163.92127990722656, -160.3307647705078, -156.74024963378906, -153.1497344970703, -149.5592041015625, -145.96868896484375, -142.378173828125, -138.78765869140625, -135.1971435546875, -131.60662841796875, -128.01611328125, -124.42559814453125, -120.8350830078125, -117.24456787109375, -113.654052734375, -110.06353759765625, -106.4730224609375, -102.88250732421875, -99.2919921875, -95.70147705078125, -92.1109619140625, -88.52044677734375, -84.929931640625, -81.33941650390625, -77.7489013671875, -74.15838623046875, -70.56787109375, -66.97735595703125, -63.386837005615234, -59.796321868896484, -56.205806732177734, -52.61528778076172, -49.02477264404297, -45.43425750732422, -41.84374237060547, -38.25322723388672, -34.66271209716797, -31.07219696044922, -27.48168182373047, -23.891164779663086, -20.300649642944336, -16.710134506225586, -13.119617462158203, -9.529102325439453, -5.938587188720703, -2.348071575164795, 1.2424440383911133, 4.83296012878418, 8.42347526550293, 12.01399040222168, 15.604507446289062, 19.195022583007812, 22.785537719726562]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 7.0, 8.0, 9.0, 7.0, 9.0, 14.0, 13.0, 23.0, 18.0, 22.0, 19.0, 31.0, 27.0, 30.0, 31.0, 35.0, 43.0, 42.0, 46.0, 36.0, 38.0, 41.0, 53.0, 54.0, 37.0, 37.0, 36.0, 28.0, 32.0, 28.0, 22.0, 17.0, 16.0, 17.0, 17.0, 12.0, 15.0, 13.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-59.79783630371094, -58.027889251708984, -56.25794219970703, -54.48799514770508, -52.718048095703125, -50.948097229003906, -49.17815017700195, -47.408203125, -45.63825607299805, -43.868309020996094, -42.09836196899414, -40.32841491699219, -38.55846405029297, -36.78852081298828, -35.01856994628906, -33.24862289428711, -31.478675842285156, -29.708728790283203, -27.93878173828125, -26.168832778930664, -24.39888572692871, -22.628938674926758, -20.858989715576172, -19.08904266357422, -17.319095611572266, -15.549148559570312, -13.779200553894043, -12.009252548217773, -10.23930549621582, -8.469358444213867, -6.699410438537598, -4.929462432861328, -3.159515380859375, -1.3895678520202637, 0.38037967681884766, 2.150327205657959, 3.9202747344970703, 5.690221786499023, 7.460169792175293, 9.230117797851562, 11.000064849853516, 12.770011901855469, 14.539959907531738, 16.309907913208008, 18.07985496520996, 19.849802017211914, 21.6197509765625, 23.389698028564453, 25.159645080566406, 26.92959213256836, 28.699539184570312, 30.4694881439209, 32.23943328857422, 34.00938415527344, 35.77933120727539, 37.549278259277344, 39.3192253112793, 41.08917236328125, 42.8591194152832, 44.629066467285156, 46.399017333984375, 48.16896057128906, 49.93891143798828, 51.708858489990234, 53.47880554199219]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 2.0, 7.0, 8.0, 7.0, 10.0, 8.0, 19.0, 19.0, 23.0, 30.0, 27.0, 25.0, 36.0, 37.0, 43.0, 33.0, 46.0, 38.0, 52.0, 51.0, 44.0, 43.0, 42.0, 53.0, 44.0, 39.0, 25.0, 22.0, 25.0, 20.0, 24.0, 19.0, 16.0, 13.0, 15.0, 11.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75, -7.5040283203125, -7.258056640625, -7.0120849609375, -6.76611328125, -6.5201416015625, -6.274169921875, -6.0281982421875, -5.7822265625, -5.5362548828125, -5.290283203125, -5.0443115234375, -4.79833984375, -4.5523681640625, -4.306396484375, -4.0604248046875, -3.814453125, -3.5684814453125, -3.322509765625, -3.0765380859375, -2.83056640625, -2.5845947265625, -2.338623046875, -2.0926513671875, -1.8466796875, -1.6007080078125, -1.354736328125, -1.1087646484375, -0.86279296875, -0.6168212890625, -0.370849609375, -0.1248779296875, 0.12109375, 0.3670654296875, 0.613037109375, 0.8590087890625, 1.10498046875, 1.3509521484375, 1.596923828125, 1.8428955078125, 2.0888671875, 2.3348388671875, 2.580810546875, 2.8267822265625, 3.07275390625, 3.3187255859375, 3.564697265625, 3.8106689453125, 4.056640625, 4.3026123046875, 4.548583984375, 4.7945556640625, 5.04052734375, 5.2864990234375, 5.532470703125, 5.7784423828125, 6.0244140625, 6.2703857421875, 6.516357421875, 6.7623291015625, 7.00830078125, 7.2542724609375, 7.500244140625, 7.7462158203125, 7.9921875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 8.0, 12.0, 11.0, 15.0, 25.0, 32.0, 31.0, 30.0, 47.0, 66.0, 106.0, 99.0, 180.0, 319.0, 995.0, 8152.0, 247897.0, 3100914.0, 809707.0, 22795.0, 1676.0, 410.0, 202.0, 112.0, 86.0, 67.0, 56.0, 47.0, 38.0, 39.0, 20.0, 14.0, 15.0, 15.0, 11.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.28076171875, -21.5771484375, -20.87353515625, -20.169921875, -19.46630859375, -18.7626953125, -18.05908203125, -17.35546875, -16.65185546875, -15.9482421875, -15.24462890625, -14.541015625, -13.83740234375, -13.1337890625, -12.43017578125, -11.7265625, -11.02294921875, -10.3193359375, -9.61572265625, -8.912109375, -8.20849609375, -7.5048828125, -6.80126953125, -6.09765625, -5.39404296875, -4.6904296875, -3.98681640625, -3.283203125, -2.57958984375, -1.8759765625, -1.17236328125, -0.46875, 0.23486328125, 0.9384765625, 1.64208984375, 2.345703125, 3.04931640625, 3.7529296875, 4.45654296875, 5.16015625, 5.86376953125, 6.5673828125, 7.27099609375, 7.974609375, 8.67822265625, 9.3818359375, 10.08544921875, 10.7890625, 11.49267578125, 12.1962890625, 12.89990234375, 13.603515625, 14.30712890625, 15.0107421875, 15.71435546875, 16.41796875, 17.12158203125, 17.8251953125, 18.52880859375, 19.232421875, 19.93603515625, 20.6396484375, 21.34326171875, 22.046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 12.0, 14.0, 24.0, 15.0, 30.0, 47.0, 58.0, 90.0, 139.0, 213.0, 321.0, 456.0, 568.0, 583.0, 444.0, 343.0, 229.0, 139.0, 100.0, 61.0, 67.0, 35.0, 31.0, 18.0, 15.0, 8.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9296875, -14.4166259765625, -13.903564453125, -13.3905029296875, -12.87744140625, -12.3643798828125, -11.851318359375, -11.3382568359375, -10.8251953125, -10.3121337890625, -9.799072265625, -9.2860107421875, -8.77294921875, -8.2598876953125, -7.746826171875, -7.2337646484375, -6.720703125, -6.2076416015625, -5.694580078125, -5.1815185546875, -4.66845703125, -4.1553955078125, -3.642333984375, -3.1292724609375, -2.6162109375, -2.1031494140625, -1.590087890625, -1.0770263671875, -0.56396484375, -0.0509033203125, 0.462158203125, 0.9752197265625, 1.48828125, 2.0013427734375, 2.514404296875, 3.0274658203125, 3.54052734375, 4.0535888671875, 4.566650390625, 5.0797119140625, 5.5927734375, 6.1058349609375, 6.618896484375, 7.1319580078125, 7.64501953125, 8.1580810546875, 8.671142578125, 9.1842041015625, 9.697265625, 10.2103271484375, 10.723388671875, 11.2364501953125, 11.74951171875, 12.2625732421875, 12.775634765625, 13.2886962890625, 13.8017578125, 14.3148193359375, 14.827880859375, 15.3409423828125, 15.85400390625, 16.3670654296875, 16.880126953125, 17.3931884765625, 17.90625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 17.0, 28.0, 35.0, 54.0, 68.0, 97.0, 165.0, 291.0, 479.0, 1477.0, 1449033.0, 2739366.0, 1869.0, 499.0, 289.0, 163.0, 97.0, 73.0, 49.0, 34.0, 24.0, 11.0, 17.0, 9.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.625, -90.953125, -88.28125, -85.609375, -82.9375, -80.265625, -77.59375, -74.921875, -72.25, -69.578125, -66.90625, -64.234375, -61.5625, -58.890625, -56.21875, -53.546875, -50.875, -48.203125, -45.53125, -42.859375, -40.1875, -37.515625, -34.84375, -32.171875, -29.5, -26.828125, -24.15625, -21.484375, -18.8125, -16.140625, -13.46875, -10.796875, -8.125, -5.453125, -2.78125, -0.109375, 2.5625, 5.234375, 7.90625, 10.578125, 13.25, 15.921875, 18.59375, 21.265625, 23.9375, 26.609375, 29.28125, 31.953125, 34.625, 37.296875, 39.96875, 42.640625, 45.3125, 47.984375, 50.65625, 53.328125, 56.0, 58.671875, 61.34375, 64.015625, 66.6875, 69.359375, 72.03125, 74.703125, 77.375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 41.0, 185.0, 395.0, 307.0, 76.0, 12.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.16845703125, -133.52442932128906, -127.88040924072266, -122.23638153076172, -116.59235382080078, -110.94833374023438, -105.30430603027344, -99.6602783203125, -94.01625061035156, -88.37222290039062, -82.72820281982422, -77.08417510986328, -71.44014739990234, -65.79612731933594, -60.152099609375, -54.50807189941406, -48.864051818847656, -43.220027923583984, -37.57600021362305, -31.931976318359375, -26.28795051574707, -20.643924713134766, -14.999900817871094, -9.355873107910156, -3.7118492126464844, 1.932176113128662, 7.576201438903809, 13.220226287841797, 18.8642520904541, 24.508277893066406, 30.152301788330078, 35.796329498291016, 41.44035339355469, 47.08437728881836, 52.7284049987793, 58.37242889404297, 64.0164566040039, 69.66047668457031, 75.30450439453125, 80.94853210449219, 86.59255981445312, 92.23658752441406, 97.88060760498047, 103.5246353149414, 109.16866302490234, 114.81268310546875, 120.45671081542969, 126.10073852539062, 131.7447509765625, 137.38877868652344, 143.03280639648438, 148.67681884765625, 154.3208465576172, 159.96487426757812, 165.60890197753906, 171.2529296875, 176.89695739746094, 182.54098510742188, 188.1850128173828, 193.82904052734375, 199.47305297851562, 205.11708068847656, 210.7611083984375, 216.40513610839844, 222.04916381835938]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 1.0, 9.0, 9.0, 19.0, 14.0, 20.0, 23.0, 32.0, 33.0, 28.0, 33.0, 33.0, 37.0, 39.0, 44.0, 50.0, 43.0, 55.0, 37.0, 40.0, 38.0, 34.0, 37.0, 34.0, 27.0, 25.0, 25.0, 33.0, 18.0, 22.0, 19.0, 14.0, 19.0, 14.0, 10.0, 6.0, 2.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.55462646484375, -44.15840530395508, -42.762184143066406, -41.365966796875, -39.96974563598633, -38.573524475097656, -37.177303314208984, -35.78108215332031, -34.384864807128906, -32.988643646240234, -31.592424392700195, -30.196203231811523, -28.799983978271484, -27.403762817382812, -26.00754165649414, -24.6113224029541, -23.21510124206543, -21.818880081176758, -20.42266082763672, -19.026439666748047, -17.630220413208008, -16.233999252319336, -14.83777904510498, -13.441558837890625, -12.04533863067627, -10.649118423461914, -9.252898216247559, -7.856677532196045, -6.4604573249816895, -5.064237117767334, -3.6680164337158203, -2.271796226501465, -0.8755760192871094, 0.5206443071365356, 1.9168646335601807, 3.3130850791931152, 4.709305286407471, 6.105525493621826, 7.50174617767334, 8.897966384887695, 10.29418659210205, 11.690406799316406, 13.086627006530762, 14.482847213745117, 15.879068374633789, 17.275287628173828, 18.6715087890625, 20.067729949951172, 21.46394920349121, 22.860170364379883, 24.256389617919922, 25.652610778808594, 27.048830032348633, 28.445051193237305, 29.841270446777344, 31.237491607666016, 32.63371276855469, 34.02993392944336, 35.42615509033203, 36.82237243652344, 38.21859359741211, 39.61481475830078, 41.01103591918945, 42.407257080078125, 43.80347442626953]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 9.0, 2.0, 12.0, 9.0, 14.0, 10.0, 19.0, 22.0, 25.0, 26.0, 33.0, 26.0, 35.0, 36.0, 38.0, 36.0, 38.0, 34.0, 38.0, 40.0, 41.0, 57.0, 44.0, 28.0, 43.0, 45.0, 22.0, 22.0, 32.0, 20.0, 19.0, 18.0, 17.0, 11.0, 18.0, 9.0, 11.0, 7.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.160888671875, -5.95068359375, -5.740478515625, -5.5302734375, -5.320068359375, -5.10986328125, -4.899658203125, -4.689453125, -4.479248046875, -4.26904296875, -4.058837890625, -3.8486328125, -3.638427734375, -3.42822265625, -3.218017578125, -3.0078125, -2.797607421875, -2.58740234375, -2.377197265625, -2.1669921875, -1.956787109375, -1.74658203125, -1.536376953125, -1.326171875, -1.115966796875, -0.90576171875, -0.695556640625, -0.4853515625, -0.275146484375, -0.06494140625, 0.145263671875, 0.35546875, 0.565673828125, 0.77587890625, 0.986083984375, 1.1962890625, 1.406494140625, 1.61669921875, 1.826904296875, 2.037109375, 2.247314453125, 2.45751953125, 2.667724609375, 2.8779296875, 3.088134765625, 3.29833984375, 3.508544921875, 3.71875, 3.928955078125, 4.13916015625, 4.349365234375, 4.5595703125, 4.769775390625, 4.97998046875, 5.190185546875, 5.400390625, 5.610595703125, 5.82080078125, 6.031005859375, 6.2412109375, 6.451416015625, 6.66162109375, 6.871826171875, 7.08203125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 11.0, 26.0, 26.0, 41.0, 66.0, 100.0, 125.0, 196.0, 358.0, 511.0, 716.0, 1011.0, 1584.0, 2476.0, 3780.0, 5815.0, 8438.0, 13235.0, 19889.0, 30221.0, 45207.0, 69180.0, 105217.0, 152964.0, 178592.0, 138199.0, 92022.0, 60778.0, 40173.0, 26217.0, 17337.0, 11697.0, 7589.0, 5025.0, 3294.0, 2212.0, 1435.0, 940.0, 634.0, 438.0, 262.0, 171.0, 120.0, 61.0, 54.0, 41.0, 20.0, 17.0, 12.0, 11.0, 8.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.46923828125, -0.4547309875488281, -0.44022369384765625, -0.4257164001464844, -0.4112091064453125, -0.3967018127441406, -0.38219451904296875, -0.3676872253417969, -0.353179931640625, -0.3386726379394531, -0.32416534423828125, -0.3096580505371094, -0.2951507568359375, -0.2806434631347656, -0.26613616943359375, -0.2516288757324219, -0.23712158203125, -0.22261428833007812, -0.20810699462890625, -0.19359970092773438, -0.1790924072265625, -0.16458511352539062, -0.15007781982421875, -0.13557052612304688, -0.121063232421875, -0.10655593872070312, -0.09204864501953125, -0.07754135131835938, -0.0630340576171875, -0.048526763916015625, -0.03401947021484375, -0.019512176513671875, -0.0050048828125, 0.009502410888671875, 0.02400970458984375, 0.038516998291015625, 0.0530242919921875, 0.06753158569335938, 0.08203887939453125, 0.09654617309570312, 0.111053466796875, 0.12556076049804688, 0.14006805419921875, 0.15457534790039062, 0.1690826416015625, 0.18358993530273438, 0.19809722900390625, 0.21260452270507812, 0.22711181640625, 0.24161911010742188, 0.25612640380859375, 0.2706336975097656, 0.2851409912109375, 0.2996482849121094, 0.31415557861328125, 0.3286628723144531, 0.343170166015625, 0.3576774597167969, 0.37218475341796875, 0.3866920471191406, 0.4011993408203125, 0.4157066345214844, 0.43021392822265625, 0.4447212219238281, 0.459228515625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 1.0, 5.0, 8.0, 7.0, 14.0, 17.0, 17.0, 20.0, 13.0, 18.0, 21.0, 28.0, 26.0, 25.0, 31.0, 28.0, 42.0, 29.0, 35.0, 53.0, 1064.0, 52.0, 29.0, 44.0, 46.0, 33.0, 35.0, 29.0, 34.0, 43.0, 31.0, 29.0, 20.0, 14.0, 17.0, 16.0, 11.0, 11.0, 11.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.84375, -4.707489013671875, -4.57122802734375, -4.434967041015625, -4.2987060546875, -4.162445068359375, -4.02618408203125, -3.889923095703125, -3.753662109375, -3.617401123046875, -3.48114013671875, -3.344879150390625, -3.2086181640625, -3.072357177734375, -2.93609619140625, -2.799835205078125, -2.66357421875, -2.527313232421875, -2.39105224609375, -2.254791259765625, -2.1185302734375, -1.982269287109375, -1.84600830078125, -1.709747314453125, -1.573486328125, -1.437225341796875, -1.30096435546875, -1.164703369140625, -1.0284423828125, -0.892181396484375, -0.75592041015625, -0.619659423828125, -0.4833984375, -0.347137451171875, -0.21087646484375, -0.074615478515625, 0.0616455078125, 0.197906494140625, 0.33416748046875, 0.470428466796875, 0.606689453125, 0.742950439453125, 0.87921142578125, 1.015472412109375, 1.1517333984375, 1.287994384765625, 1.42425537109375, 1.560516357421875, 1.69677734375, 1.833038330078125, 1.96929931640625, 2.105560302734375, 2.2418212890625, 2.378082275390625, 2.51434326171875, 2.650604248046875, 2.786865234375, 2.923126220703125, 3.05938720703125, 3.195648193359375, 3.3319091796875, 3.468170166015625, 3.60443115234375, 3.740692138671875, 3.876953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 8.0, 9.0, 14.0, 26.0, 37.0, 59.0, 101.0, 122.0, 215.0, 313.0, 480.0, 715.0, 1209.0, 1774.0, 2706.0, 4177.0, 6368.0, 10014.0, 15408.0, 23974.0, 36626.0, 57117.0, 88577.0, 134592.0, 1222597.0, 162208.0, 115555.0, 75332.0, 48445.0, 30949.0, 20477.0, 13167.0, 8365.0, 5315.0, 3512.0, 2287.0, 1538.0, 943.0, 623.0, 369.0, 289.0, 187.0, 102.0, 75.0, 66.0, 36.0, 15.0, 13.0, 4.0, 9.0, 9.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.43994140625, -0.4265327453613281, -0.41312408447265625, -0.3997154235839844, -0.3863067626953125, -0.3728981018066406, -0.35948944091796875, -0.3460807800292969, -0.332672119140625, -0.3192634582519531, -0.30585479736328125, -0.2924461364746094, -0.2790374755859375, -0.2656288146972656, -0.25222015380859375, -0.23881149291992188, -0.22540283203125, -0.21199417114257812, -0.19858551025390625, -0.18517684936523438, -0.1717681884765625, -0.15835952758789062, -0.14495086669921875, -0.13154220581054688, -0.118133544921875, -0.10472488403320312, -0.09131622314453125, -0.07790756225585938, -0.0644989013671875, -0.051090240478515625, -0.03768157958984375, -0.024272918701171875, -0.0108642578125, 0.002544403076171875, 0.01595306396484375, 0.029361724853515625, 0.0427703857421875, 0.056179046630859375, 0.06958770751953125, 0.08299636840820312, 0.096405029296875, 0.10981369018554688, 0.12322235107421875, 0.13663101196289062, 0.1500396728515625, 0.16344833374023438, 0.17685699462890625, 0.19026565551757812, 0.20367431640625, 0.21708297729492188, 0.23049163818359375, 0.24390029907226562, 0.2573089599609375, 0.2707176208496094, 0.28412628173828125, 0.2975349426269531, 0.310943603515625, 0.3243522644042969, 0.33776092529296875, 0.3511695861816406, 0.3645782470703125, 0.3779869079589844, 0.39139556884765625, 0.4048042297363281, 0.418212890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 5.0, 8.0, 13.0, 10.0, 12.0, 18.0, 22.0, 17.0, 34.0, 26.0, 30.0, 48.0, 39.0, 49.0, 47.0, 44.0, 63.0, 49.0, 59.0, 38.0, 47.0, 46.0, 33.0, 32.0, 30.0, 32.0, 37.0, 20.0, 19.0, 10.0, 9.0, 9.0, 8.0, 3.0, 6.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001132965087890625, -0.00109119713306427, -0.001049429178237915, -0.00100766122341156, -0.0009658932685852051, -0.0009241253137588501, -0.0008823573589324951, -0.0008405894041061401, -0.0007988214492797852, -0.0007570534944534302, -0.0007152855396270752, -0.0006735175848007202, -0.0006317496299743652, -0.0005899816751480103, -0.0005482137203216553, -0.0005064457654953003, -0.0004646778106689453, -0.00042290985584259033, -0.00038114190101623535, -0.00033937394618988037, -0.0002976059913635254, -0.0002558380365371704, -0.00021407008171081543, -0.00017230212688446045, -0.00013053417205810547, -8.876621723175049e-05, -4.699826240539551e-05, -5.230307579040527e-06, 3.653764724731445e-05, 7.830560207366943e-05, 0.00012007355690002441, 0.0001618415117263794, 0.00020360946655273438, 0.00024537742137908936, 0.00028714537620544434, 0.0003289133310317993, 0.0003706812858581543, 0.0004124492406845093, 0.00045421719551086426, 0.0004959851503372192, 0.0005377531051635742, 0.0005795210599899292, 0.0006212890148162842, 0.0006630569696426392, 0.0007048249244689941, 0.0007465928792953491, 0.0007883608341217041, 0.0008301287889480591, 0.0008718967437744141, 0.000913664698600769, 0.000955432653427124, 0.000997200608253479, 0.001038968563079834, 0.001080736517906189, 0.001122504472732544, 0.001164272427558899, 0.001206040382385254, 0.0012478083372116089, 0.0012895762920379639, 0.0013313442468643188, 0.0013731122016906738, 0.0014148801565170288, 0.0014566481113433838, 0.0014984160661697388, 0.0015401840209960938]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 2.0, 1.0, 1.0, 7.0, 13.0, 6.0, 14.0, 20.0, 21.0, 28.0, 35.0, 52.0, 60.0, 89.0, 121.0, 180.0, 355.0, 970.0, 44058.0, 997890.0, 3198.0, 617.0, 266.0, 137.0, 99.0, 66.0, 57.0, 47.0, 36.0, 35.0, 16.0, 17.0, 10.0, 6.0, 11.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.036102294921875, -0.035079240798950195, -0.03405618667602539, -0.033033132553100586, -0.03201007843017578, -0.030987024307250977, -0.029963970184326172, -0.028940916061401367, -0.027917861938476562, -0.026894807815551758, -0.025871753692626953, -0.02484869956970215, -0.023825645446777344, -0.02280259132385254, -0.021779537200927734, -0.02075648307800293, -0.019733428955078125, -0.01871037483215332, -0.017687320709228516, -0.01666426658630371, -0.015641212463378906, -0.014618158340454102, -0.013595104217529297, -0.012572050094604492, -0.011548995971679688, -0.010525941848754883, -0.009502887725830078, -0.008479833602905273, -0.007456779479980469, -0.006433725357055664, -0.005410671234130859, -0.004387617111206055, -0.00336456298828125, -0.0023415088653564453, -0.0013184547424316406, -0.00029540061950683594, 0.0007276535034179688, 0.0017507076263427734, 0.002773761749267578, 0.003796815872192383, 0.0048198699951171875, 0.005842924118041992, 0.006865978240966797, 0.007889032363891602, 0.008912086486816406, 0.009935140609741211, 0.010958194732666016, 0.01198124885559082, 0.013004302978515625, 0.01402735710144043, 0.015050411224365234, 0.01607346534729004, 0.017096519470214844, 0.01811957359313965, 0.019142627716064453, 0.020165681838989258, 0.021188735961914062, 0.022211790084838867, 0.023234844207763672, 0.024257898330688477, 0.02528095245361328, 0.026304006576538086, 0.02732706069946289, 0.028350114822387695, 0.0293731689453125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 180.0, 720.0, 110.0, 2.0], "bins": [-0.013621442019939423, -0.013399799354374409, -0.01317815575748682, -0.012956513091921806, -0.012734870426356792, -0.012513226829469204, -0.01229158416390419, -0.012069941498339176, -0.011848297901451588, -0.011626655235886574, -0.011405011638998985, -0.011183368973433971, -0.010961726307868958, -0.010740082710981369, -0.010518440045416355, -0.010296797379851341, -0.010075154714286327, -0.009853512048721313, -0.009631868451833725, -0.009410225786268711, -0.009188583120703697, -0.008966939523816109, -0.008745296858251095, -0.008523654192686081, -0.008302010595798492, -0.008080367930233479, -0.00785872433334589, -0.007637081667780876, -0.007415438536554575, -0.007193795870989561, -0.00697215273976326, -0.006750510074198246, -0.006528867408633232, -0.006307224277406931, -0.006085581611841917, -0.005863938480615616, -0.005642295349389315, -0.005420652683824301, -0.005199009552598, -0.004977366887032986, -0.004755723290145397, -0.004534080158919096, -0.004312437493354082, -0.004090794362127781, -0.0038691514637321234, -0.003647508565336466, -0.0034258654341101646, -0.003204222535714507, -0.0029825796373188496, -0.002760936738923192, -0.002539293607696891, -0.0023176507093012333, -0.0020960078109055758, -0.0018743647960945964, -0.001652721781283617, -0.0014310788828879595, -0.001209435984492302, -0.0009877929696813226, -0.000766150071285665, -0.0005445070564746857, -0.0003228640998713672, -0.00010122114326804876, 0.0001204218715429306, 0.00034206476993858814, 0.0005637077847495675]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 3.0, 8.0, 7.0, 10.0, 11.0, 11.0, 15.0, 19.0, 20.0, 19.0, 22.0, 28.0, 29.0, 37.0, 33.0, 46.0, 50.0, 46.0, 53.0, 43.0, 45.0, 53.0, 45.0, 40.0, 45.0, 31.0, 32.0, 29.0, 26.0, 35.0, 21.0, 22.0, 18.0, 15.0, 5.0, 4.0, 8.0, 10.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000621795654296875, -0.0005951123312115669, -0.0005684290081262589, -0.0005417456850409508, -0.0005150623619556427, -0.0004883790388703346, -0.00046169571578502655, -0.0004350123926997185, -0.0004083290696144104, -0.0003816457465291023, -0.00035496242344379425, -0.0003282791003584862, -0.0003015957772731781, -0.00027491245418787, -0.00024822913110256195, -0.00022154580801725388, -0.0001948624849319458, -0.00016817916184663773, -0.00014149583876132965, -0.00011481251567602158, -8.81291925907135e-05, -6.144586950540543e-05, -3.476254642009735e-05, -8.079223334789276e-06, 1.86040997505188e-05, 4.5287422835826874e-05, 7.197074592113495e-05, 9.865406900644302e-05, 0.0001253373920917511, 0.00015202071517705917, 0.00017870403826236725, 0.00020538736134767532, 0.0002320706844329834, 0.0002587540075182915, 0.00028543733060359955, 0.0003121206536889076, 0.0003388039767742157, 0.0003654872998595238, 0.00039217062294483185, 0.0004188539460301399, 0.000445537269115448, 0.0004722205922007561, 0.0004989039152860641, 0.0005255872383713722, 0.0005522705614566803, 0.0005789538845419884, 0.0006056372076272964, 0.0006323205307126045, 0.0006590038537979126, 0.0006856871768832207, 0.0007123704999685287, 0.0007390538230538368, 0.0007657371461391449, 0.000792420469224453, 0.000819103792309761, 0.0008457871153950691, 0.0008724704384803772, 0.0008991537615656853, 0.0009258370846509933, 0.0009525204077363014, 0.0009792037308216095, 0.0010058870539069176, 0.0010325703769922256, 0.0010592537000775337, 0.0010859370231628418]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 9.0, 2.0, 12.0, 9.0, 14.0, 10.0, 19.0, 22.0, 25.0, 26.0, 33.0, 26.0, 35.0, 36.0, 38.0, 36.0, 38.0, 34.0, 38.0, 40.0, 41.0, 57.0, 44.0, 28.0, 43.0, 44.0, 23.0, 22.0, 32.0, 20.0, 19.0, 18.0, 17.0, 11.0, 18.0, 9.0, 11.0, 7.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.160888671875, -5.95068359375, -5.740478515625, -5.5302734375, -5.320068359375, -5.10986328125, -4.899658203125, -4.689453125, -4.479248046875, -4.26904296875, -4.058837890625, -3.8486328125, -3.638427734375, -3.42822265625, -3.218017578125, -3.0078125, -2.797607421875, -2.58740234375, -2.377197265625, -2.1669921875, -1.956787109375, -1.74658203125, -1.536376953125, -1.326171875, -1.115966796875, -0.90576171875, -0.695556640625, -0.4853515625, -0.275146484375, -0.06494140625, 0.145263671875, 0.35546875, 0.565673828125, 0.77587890625, 0.986083984375, 1.1962890625, 1.406494140625, 1.61669921875, 1.826904296875, 2.037109375, 2.247314453125, 2.45751953125, 2.667724609375, 2.8779296875, 3.088134765625, 3.29833984375, 3.508544921875, 3.71875, 3.928955078125, 4.13916015625, 4.349365234375, 4.5595703125, 4.769775390625, 4.97998046875, 5.190185546875, 5.400390625, 5.610595703125, 5.82080078125, 6.031005859375, 6.2412109375, 6.451416015625, 6.66162109375, 6.871826171875, 7.08203125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 9.0, 5.0, 9.0, 7.0, 15.0, 9.0, 23.0, 20.0, 27.0, 38.0, 58.0, 84.0, 92.0, 131.0, 212.0, 321.0, 617.0, 1752.0, 8739.0, 53814.0, 363762.0, 526061.0, 76350.0, 12134.0, 2375.0, 736.0, 369.0, 229.0, 141.0, 107.0, 67.0, 50.0, 47.0, 35.0, 24.0, 19.0, 18.0, 11.0, 8.0, 9.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6796875, -13.23974609375, -12.7998046875, -12.35986328125, -11.919921875, -11.47998046875, -11.0400390625, -10.60009765625, -10.16015625, -9.72021484375, -9.2802734375, -8.84033203125, -8.400390625, -7.96044921875, -7.5205078125, -7.08056640625, -6.640625, -6.20068359375, -5.7607421875, -5.32080078125, -4.880859375, -4.44091796875, -4.0009765625, -3.56103515625, -3.12109375, -2.68115234375, -2.2412109375, -1.80126953125, -1.361328125, -0.92138671875, -0.4814453125, -0.04150390625, 0.3984375, 0.83837890625, 1.2783203125, 1.71826171875, 2.158203125, 2.59814453125, 3.0380859375, 3.47802734375, 3.91796875, 4.35791015625, 4.7978515625, 5.23779296875, 5.677734375, 6.11767578125, 6.5576171875, 6.99755859375, 7.4375, 7.87744140625, 8.3173828125, 8.75732421875, 9.197265625, 9.63720703125, 10.0771484375, 10.51708984375, 10.95703125, 11.39697265625, 11.8369140625, 12.27685546875, 12.716796875, 13.15673828125, 13.5966796875, 14.03662109375, 14.4765625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 5.0, 2.0, 11.0, 4.0, 12.0, 4.0, 14.0, 16.0, 14.0, 16.0, 18.0, 24.0, 27.0, 35.0, 33.0, 46.0, 38.0, 49.0, 64.0, 110.0, 199.0, 1496.0, 212.0, 96.0, 80.0, 49.0, 54.0, 44.0, 27.0, 30.0, 31.0, 34.0, 24.0, 25.0, 18.0, 23.0, 12.0, 8.0, 4.0, 10.0, 6.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.734375, -22.035888671875, -21.33740234375, -20.638916015625, -19.9404296875, -19.241943359375, -18.54345703125, -17.844970703125, -17.146484375, -16.447998046875, -15.74951171875, -15.051025390625, -14.3525390625, -13.654052734375, -12.95556640625, -12.257080078125, -11.55859375, -10.860107421875, -10.16162109375, -9.463134765625, -8.7646484375, -8.066162109375, -7.36767578125, -6.669189453125, -5.970703125, -5.272216796875, -4.57373046875, -3.875244140625, -3.1767578125, -2.478271484375, -1.77978515625, -1.081298828125, -0.3828125, 0.315673828125, 1.01416015625, 1.712646484375, 2.4111328125, 3.109619140625, 3.80810546875, 4.506591796875, 5.205078125, 5.903564453125, 6.60205078125, 7.300537109375, 7.9990234375, 8.697509765625, 9.39599609375, 10.094482421875, 10.79296875, 11.491455078125, 12.18994140625, 12.888427734375, 13.5869140625, 14.285400390625, 14.98388671875, 15.682373046875, 16.380859375, 17.079345703125, 17.77783203125, 18.476318359375, 19.1748046875, 19.873291015625, 20.57177734375, 21.270263671875, 21.96875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 9.0, 15.0, 8.0, 18.0, 24.0, 26.0, 44.0, 51.0, 76.0, 98.0, 115.0, 232.0, 401.0, 1121.0, 25260.0, 3111692.0, 4859.0, 737.0, 296.0, 179.0, 127.0, 79.0, 61.0, 54.0, 32.0, 26.0, 28.0, 13.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-108.1875, -105.037109375, -101.88671875, -98.736328125, -95.5859375, -92.435546875, -89.28515625, -86.134765625, -82.984375, -79.833984375, -76.68359375, -73.533203125, -70.3828125, -67.232421875, -64.08203125, -60.931640625, -57.78125, -54.630859375, -51.48046875, -48.330078125, -45.1796875, -42.029296875, -38.87890625, -35.728515625, -32.578125, -29.427734375, -26.27734375, -23.126953125, -19.9765625, -16.826171875, -13.67578125, -10.525390625, -7.375, -4.224609375, -1.07421875, 2.076171875, 5.2265625, 8.376953125, 11.52734375, 14.677734375, 17.828125, 20.978515625, 24.12890625, 27.279296875, 30.4296875, 33.580078125, 36.73046875, 39.880859375, 43.03125, 46.181640625, 49.33203125, 52.482421875, 55.6328125, 58.783203125, 61.93359375, 65.083984375, 68.234375, 71.384765625, 74.53515625, 77.685546875, 80.8359375, 83.986328125, 87.13671875, 90.287109375, 93.4375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [4.0, 5.0, 59.0, 167.0, 295.0, 306.0, 144.0, 25.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.430879592895508, -9.155984878540039, -6.88109016418457, -4.606195449829102, -2.331300735473633, -0.05640602111816406, 2.2184886932373047, 4.493383407592773, 6.768278121948242, 9.043172836303711, 11.31806755065918, 13.592962265014648, 15.867856979370117, 18.142751693725586, 20.417646408081055, 22.692541122436523, 24.967435836791992, 27.24233055114746, 29.51722526550293, 31.7921199798584, 34.0670166015625, 36.34191131591797, 38.61680603027344, 40.891700744628906, 43.166595458984375, 45.441490173339844, 47.71638488769531, 49.99127960205078, 52.26617431640625, 54.54106903076172, 56.81596374511719, 59.090858459472656, 61.365753173828125, 63.640647888183594, 65.91554260253906, 68.19043731689453, 70.46533203125, 72.74022674560547, 75.01512145996094, 77.2900161743164, 79.56491088867188, 81.83980560302734, 84.11470031738281, 86.38959503173828, 88.66448974609375, 90.93938446044922, 93.21427917480469, 95.48917388916016, 97.76406860351562, 100.0389633178711, 102.31385803222656, 104.58875274658203, 106.8636474609375, 109.13854217529297, 111.41343688964844, 113.6883316040039, 115.96322631835938, 118.23812103271484, 120.51301574707031, 122.78791046142578, 125.06280517578125, 127.33769989013672, 129.6125946044922, 131.88748168945312, 134.16238403320312]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 3.0, 3.0, 6.0, 9.0, 13.0, 7.0, 14.0, 12.0, 15.0, 22.0, 27.0, 22.0, 28.0, 33.0, 26.0, 39.0, 29.0, 36.0, 38.0, 31.0, 32.0, 43.0, 41.0, 45.0, 46.0, 34.0, 25.0, 28.0, 40.0, 25.0, 21.0, 27.0, 17.0, 19.0, 12.0, 16.0, 16.0, 13.0, 10.0, 16.0, 8.0, 10.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 4.0, 3.0], "bins": [-57.18463134765625, -55.519927978515625, -53.855224609375, -52.190521240234375, -50.52581787109375, -48.861114501953125, -47.196414947509766, -45.53171157836914, -43.867008209228516, -42.20230484008789, -40.537601470947266, -38.87289810180664, -37.20819854736328, -35.543495178222656, -33.87879180908203, -32.214088439941406, -30.54938507080078, -28.884681701660156, -27.21997833251953, -25.55527687072754, -23.890573501586914, -22.22587013244629, -20.561168670654297, -18.896465301513672, -17.231761932373047, -15.567058563232422, -13.902356147766113, -12.237653732299805, -10.57295036315918, -8.908246994018555, -7.243544578552246, -5.5788421630859375, -3.914142608642578, -2.2494397163391113, -0.5847368240356445, 1.0799660682678223, 2.744668960571289, 4.409372329711914, 6.074074745178223, 7.738777160644531, 9.403480529785156, 11.068183898925781, 12.73288631439209, 14.397588729858398, 16.062292098999023, 17.72699546813965, 19.39169692993164, 21.056400299072266, 22.72110366821289, 24.385807037353516, 26.05051040649414, 27.715211868286133, 29.379915237426758, 31.044618606567383, 32.709320068359375, 34.3740234375, 36.038726806640625, 37.70343017578125, 39.368133544921875, 41.0328369140625, 42.697540283203125, 44.36224365234375, 46.02694320678711, 47.691646575927734, 49.35634994506836]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 6.0, 9.0, 8.0, 9.0, 12.0, 9.0, 12.0, 16.0, 17.0, 14.0, 25.0, 28.0, 32.0, 39.0, 43.0, 41.0, 41.0, 48.0, 38.0, 41.0, 55.0, 37.0, 38.0, 45.0, 44.0, 33.0, 28.0, 33.0, 30.0, 26.0, 30.0, 12.0, 18.0, 15.0, 11.0, 10.0, 10.0, 10.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171875, -6.92578125, -6.6796875, -6.43359375, -6.1875, -5.94140625, -5.6953125, -5.44921875, -5.203125, -4.95703125, -4.7109375, -4.46484375, -4.21875, -3.97265625, -3.7265625, -3.48046875, -3.234375, -2.98828125, -2.7421875, -2.49609375, -2.25, -2.00390625, -1.7578125, -1.51171875, -1.265625, -1.01953125, -0.7734375, -0.52734375, -0.28125, -0.03515625, 0.2109375, 0.45703125, 0.703125, 0.94921875, 1.1953125, 1.44140625, 1.6875, 1.93359375, 2.1796875, 2.42578125, 2.671875, 2.91796875, 3.1640625, 3.41015625, 3.65625, 3.90234375, 4.1484375, 4.39453125, 4.640625, 4.88671875, 5.1328125, 5.37890625, 5.625, 5.87109375, 6.1171875, 6.36328125, 6.609375, 6.85546875, 7.1015625, 7.34765625, 7.59375, 7.83984375, 8.0859375, 8.33203125, 8.578125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 5.0, 6.0, 3.0, 15.0, 19.0, 18.0, 34.0, 44.0, 74.0, 78.0, 103.0, 167.0, 315.0, 605.0, 1651.0, 5105.0, 20197.0, 90556.0, 387350.0, 1147223.0, 1532506.0, 743585.0, 203765.0, 45047.0, 10727.0, 2866.0, 1040.0, 440.0, 237.0, 142.0, 86.0, 56.0, 57.0, 28.0, 25.0, 21.0, 13.0, 20.0, 11.0, 6.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.853759765625, -8.55126953125, -8.248779296875, -7.9462890625, -7.643798828125, -7.34130859375, -7.038818359375, -6.736328125, -6.433837890625, -6.13134765625, -5.828857421875, -5.5263671875, -5.223876953125, -4.92138671875, -4.618896484375, -4.31640625, -4.013916015625, -3.71142578125, -3.408935546875, -3.1064453125, -2.803955078125, -2.50146484375, -2.198974609375, -1.896484375, -1.593994140625, -1.29150390625, -0.989013671875, -0.6865234375, -0.384033203125, -0.08154296875, 0.220947265625, 0.5234375, 0.825927734375, 1.12841796875, 1.430908203125, 1.7333984375, 2.035888671875, 2.33837890625, 2.640869140625, 2.943359375, 3.245849609375, 3.54833984375, 3.850830078125, 4.1533203125, 4.455810546875, 4.75830078125, 5.060791015625, 5.36328125, 5.665771484375, 5.96826171875, 6.270751953125, 6.5732421875, 6.875732421875, 7.17822265625, 7.480712890625, 7.783203125, 8.085693359375, 8.38818359375, 8.690673828125, 8.9931640625, 9.295654296875, 9.59814453125, 9.900634765625, 10.203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 8.0, 13.0, 3.0, 17.0, 31.0, 44.0, 80.0, 100.0, 142.0, 201.0, 321.0, 473.0, 560.0, 594.0, 497.0, 333.0, 218.0, 143.0, 94.0, 59.0, 47.0, 37.0, 28.0, 14.0, 6.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.640625, -21.0562744140625, -20.471923828125, -19.8875732421875, -19.30322265625, -18.7188720703125, -18.134521484375, -17.5501708984375, -16.9658203125, -16.3814697265625, -15.797119140625, -15.2127685546875, -14.62841796875, -14.0440673828125, -13.459716796875, -12.8753662109375, -12.291015625, -11.7066650390625, -11.122314453125, -10.5379638671875, -9.95361328125, -9.3692626953125, -8.784912109375, -8.2005615234375, -7.6162109375, -7.0318603515625, -6.447509765625, -5.8631591796875, -5.27880859375, -4.6944580078125, -4.110107421875, -3.5257568359375, -2.94140625, -2.3570556640625, -1.772705078125, -1.1883544921875, -0.60400390625, -0.0196533203125, 0.564697265625, 1.1490478515625, 1.7333984375, 2.3177490234375, 2.902099609375, 3.4864501953125, 4.07080078125, 4.6551513671875, 5.239501953125, 5.8238525390625, 6.408203125, 6.9925537109375, 7.576904296875, 8.1612548828125, 8.74560546875, 9.3299560546875, 9.914306640625, 10.4986572265625, 11.0830078125, 11.6673583984375, 12.251708984375, 12.8360595703125, 13.42041015625, 14.0047607421875, 14.589111328125, 15.1734619140625, 15.7578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 9.0, 8.0, 24.0, 39.0, 49.0, 63.0, 118.0, 222.0, 407.0, 933.0, 3103.0, 342894.0, 3832103.0, 11570.0, 1413.0, 596.0, 309.0, 153.0, 110.0, 62.0, 43.0, 18.0, 8.0, 11.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.8125, -54.7265625, -52.640625, -50.5546875, -48.46875, -46.3828125, -44.296875, -42.2109375, -40.125, -38.0390625, -35.953125, -33.8671875, -31.78125, -29.6953125, -27.609375, -25.5234375, -23.4375, -21.3515625, -19.265625, -17.1796875, -15.09375, -13.0078125, -10.921875, -8.8359375, -6.75, -4.6640625, -2.578125, -0.4921875, 1.59375, 3.6796875, 5.765625, 7.8515625, 9.9375, 12.0234375, 14.109375, 16.1953125, 18.28125, 20.3671875, 22.453125, 24.5390625, 26.625, 28.7109375, 30.796875, 32.8828125, 34.96875, 37.0546875, 39.140625, 41.2265625, 43.3125, 45.3984375, 47.484375, 49.5703125, 51.65625, 53.7421875, 55.828125, 57.9140625, 60.0, 62.0859375, 64.171875, 66.2578125, 68.34375, 70.4296875, 72.515625, 74.6015625, 76.6875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 9.0, 139.0, 435.0, 356.0, 71.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-233.53562927246094, -226.1939239501953, -218.85220336914062, -211.510498046875, -204.16879272460938, -196.8270721435547, -189.48536682128906, -182.14364624023438, -174.80194091796875, -167.46023559570312, -160.11851501464844, -152.7768096923828, -145.4351043701172, -138.0933837890625, -130.75167846679688, -123.40996551513672, -116.0682601928711, -108.72654724121094, -101.38484191894531, -94.04312896728516, -86.701416015625, -79.35971069335938, -72.01799774169922, -64.67628479003906, -57.33457565307617, -49.99286651611328, -42.651153564453125, -35.309444427490234, -27.96773338317871, -20.626022338867188, -13.284313201904297, -5.942600250244141, 1.39910888671875, 8.740819931030273, 16.082530975341797, 23.424240112304688, 30.76595115661621, 38.107662200927734, 45.449371337890625, 52.79108428955078, 60.13279342651367, 67.47450256347656, 74.81621551513672, 82.15792846679688, 89.4996337890625, 96.84134674072266, 104.18305969238281, 111.52476501464844, 118.8664779663086, 126.20819091796875, 133.54989624023438, 140.8916015625, 148.2333221435547, 155.5750274658203, 162.916748046875, 170.25845336914062, 177.60015869140625, 184.94186401367188, 192.28358459472656, 199.6252899169922, 206.9669952392578, 214.3087158203125, 221.65042114257812, 228.99212646484375, 236.33384704589844]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 11.0, 6.0, 8.0, 11.0, 10.0, 17.0, 18.0, 19.0, 24.0, 20.0, 17.0, 31.0, 34.0, 32.0, 34.0, 48.0, 40.0, 42.0, 39.0, 39.0, 49.0, 30.0, 38.0, 34.0, 28.0, 24.0, 43.0, 37.0, 30.0, 35.0, 27.0, 24.0, 18.0, 22.0, 10.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.094520568847656, -44.69280242919922, -43.29108428955078, -41.88936996459961, -40.48765182495117, -39.085933685302734, -37.6842155456543, -36.282501220703125, -34.88078308105469, -33.47906494140625, -32.07734680175781, -30.675630569458008, -29.273914337158203, -27.872196197509766, -26.470478057861328, -25.068761825561523, -23.667043685913086, -22.26532554626465, -20.863609313964844, -19.461891174316406, -18.0601749420166, -16.658456802368164, -15.256739616394043, -13.855022430419922, -12.4533052444458, -11.05158805847168, -9.649870872497559, -8.248153686523438, -6.846436023712158, -5.444718837738037, -4.043001174926758, -2.6412839889526367, -1.2395668029785156, 0.16215050220489502, 1.5638678073883057, 2.965585231781006, 4.367302417755127, 5.769019603729248, 7.170737266540527, 8.572454452514648, 9.97417163848877, 11.37588882446289, 12.777606010437012, 14.179323196411133, 15.58104133605957, 16.982757568359375, 18.384475708007812, 19.78619384765625, 21.187910079956055, 22.589628219604492, 23.991344451904297, 25.393062591552734, 26.79477882385254, 28.196496963500977, 29.59821319580078, 30.99993133544922, 32.401649475097656, 33.803367614746094, 35.20508575439453, 36.6068000793457, 38.00851821899414, 39.41023635864258, 40.811954498291016, 42.21366882324219, 43.615386962890625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 9.0, 9.0, 9.0, 23.0, 20.0, 17.0, 21.0, 25.0, 29.0, 38.0, 41.0, 45.0, 34.0, 31.0, 47.0, 47.0, 34.0, 30.0, 50.0, 48.0, 32.0, 27.0, 32.0, 24.0, 23.0, 21.0, 26.0, 34.0, 24.0, 17.0, 25.0, 9.0, 10.0, 9.0, 8.0, 10.0, 6.0, 3.0, 4.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.5234375, -7.30572509765625, -7.0880126953125, -6.87030029296875, -6.652587890625, -6.43487548828125, -6.2171630859375, -5.99945068359375, -5.78173828125, -5.56402587890625, -5.3463134765625, -5.12860107421875, -4.910888671875, -4.69317626953125, -4.4754638671875, -4.25775146484375, -4.0400390625, -3.82232666015625, -3.6046142578125, -3.38690185546875, -3.169189453125, -2.95147705078125, -2.7337646484375, -2.51605224609375, -2.29833984375, -2.08062744140625, -1.8629150390625, -1.64520263671875, -1.427490234375, -1.20977783203125, -0.9920654296875, -0.77435302734375, -0.556640625, -0.33892822265625, -0.1212158203125, 0.09649658203125, 0.314208984375, 0.53192138671875, 0.7496337890625, 0.96734619140625, 1.18505859375, 1.40277099609375, 1.6204833984375, 1.83819580078125, 2.055908203125, 2.27362060546875, 2.4913330078125, 2.70904541015625, 2.9267578125, 3.14447021484375, 3.3621826171875, 3.57989501953125, 3.797607421875, 4.01531982421875, 4.2330322265625, 4.45074462890625, 4.66845703125, 4.88616943359375, 5.1038818359375, 5.32159423828125, 5.539306640625, 5.75701904296875, 5.9747314453125, 6.19244384765625, 6.41015625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 16.0, 9.0, 16.0, 39.0, 40.0, 59.0, 111.0, 134.0, 240.0, 368.0, 474.0, 806.0, 1096.0, 1662.0, 2535.0, 4005.0, 5702.0, 8705.0, 13450.0, 20482.0, 31647.0, 48791.0, 75336.0, 116379.0, 172006.0, 182280.0, 126674.0, 81928.0, 53161.0, 34550.0, 22760.0, 14681.0, 9601.0, 6346.0, 4137.0, 2729.0, 1921.0, 1207.0, 819.0, 525.0, 391.0, 262.0, 149.0, 124.0, 68.0, 50.0, 34.0, 16.0, 10.0, 10.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.48345184326171875, -0.4673919677734375, -0.45133209228515625, -0.435272216796875, -0.41921234130859375, -0.4031524658203125, -0.38709259033203125, -0.37103271484375, -0.35497283935546875, -0.3389129638671875, -0.32285308837890625, -0.306793212890625, -0.29073333740234375, -0.2746734619140625, -0.25861358642578125, -0.2425537109375, -0.22649383544921875, -0.2104339599609375, -0.19437408447265625, -0.178314208984375, -0.16225433349609375, -0.1461944580078125, -0.13013458251953125, -0.11407470703125, -0.09801483154296875, -0.0819549560546875, -0.06589508056640625, -0.049835205078125, -0.03377532958984375, -0.0177154541015625, -0.00165557861328125, 0.014404296875, 0.03046417236328125, 0.0465240478515625, 0.06258392333984375, 0.078643798828125, 0.09470367431640625, 0.1107635498046875, 0.12682342529296875, 0.14288330078125, 0.15894317626953125, 0.1750030517578125, 0.19106292724609375, 0.207122802734375, 0.22318267822265625, 0.2392425537109375, 0.25530242919921875, 0.2713623046875, 0.28742218017578125, 0.3034820556640625, 0.31954193115234375, 0.335601806640625, 0.35166168212890625, 0.3677215576171875, 0.38378143310546875, 0.39984130859375, 0.41590118408203125, 0.4319610595703125, 0.44802093505859375, 0.464080810546875, 0.48014068603515625, 0.4962005615234375, 0.5122604370117188, 0.5283203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 10.0, 7.0, 13.0, 17.0, 6.0, 18.0, 12.0, 19.0, 29.0, 25.0, 30.0, 28.0, 39.0, 32.0, 32.0, 32.0, 47.0, 41.0, 1069.0, 44.0, 47.0, 41.0, 43.0, 50.0, 34.0, 40.0, 37.0, 22.0, 27.0, 23.0, 14.0, 19.0, 15.0, 15.0, 5.0, 9.0, 9.0, 2.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.02734375, -4.874267578125, -4.72119140625, -4.568115234375, -4.4150390625, -4.261962890625, -4.10888671875, -3.955810546875, -3.802734375, -3.649658203125, -3.49658203125, -3.343505859375, -3.1904296875, -3.037353515625, -2.88427734375, -2.731201171875, -2.578125, -2.425048828125, -2.27197265625, -2.118896484375, -1.9658203125, -1.812744140625, -1.65966796875, -1.506591796875, -1.353515625, -1.200439453125, -1.04736328125, -0.894287109375, -0.7412109375, -0.588134765625, -0.43505859375, -0.281982421875, -0.12890625, 0.024169921875, 0.17724609375, 0.330322265625, 0.4833984375, 0.636474609375, 0.78955078125, 0.942626953125, 1.095703125, 1.248779296875, 1.40185546875, 1.554931640625, 1.7080078125, 1.861083984375, 2.01416015625, 2.167236328125, 2.3203125, 2.473388671875, 2.62646484375, 2.779541015625, 2.9326171875, 3.085693359375, 3.23876953125, 3.391845703125, 3.544921875, 3.697998046875, 3.85107421875, 4.004150390625, 4.1572265625, 4.310302734375, 4.46337890625, 4.616455078125, 4.76953125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 10.0, 5.0, 14.0, 16.0, 30.0, 36.0, 64.0, 52.0, 123.0, 155.0, 244.0, 367.0, 508.0, 780.0, 1103.0, 1627.0, 2264.0, 3328.0, 4737.0, 7113.0, 10266.0, 14912.0, 22071.0, 32274.0, 46914.0, 68790.0, 99836.0, 138226.0, 1207036.0, 132681.0, 94694.0, 65478.0, 44722.0, 30901.0, 20450.0, 14143.0, 9734.0, 6507.0, 4705.0, 3126.0, 2243.0, 1530.0, 990.0, 706.0, 518.0, 327.0, 253.0, 184.0, 102.0, 68.0, 47.0, 56.0, 30.0, 14.0, 12.0, 8.0, 7.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.376220703125, -0.3638572692871094, -0.35149383544921875, -0.3391304016113281, -0.3267669677734375, -0.3144035339355469, -0.30204010009765625, -0.2896766662597656, -0.277313232421875, -0.2649497985839844, -0.25258636474609375, -0.24022293090820312, -0.2278594970703125, -0.21549606323242188, -0.20313262939453125, -0.19076919555664062, -0.17840576171875, -0.16604232788085938, -0.15367889404296875, -0.14131546020507812, -0.1289520263671875, -0.11658859252929688, -0.10422515869140625, -0.09186172485351562, -0.079498291015625, -0.06713485717773438, -0.05477142333984375, -0.042407989501953125, -0.0300445556640625, -0.017681121826171875, -0.00531768798828125, 0.007045745849609375, 0.0194091796875, 0.031772613525390625, 0.04413604736328125, 0.056499481201171875, 0.0688629150390625, 0.08122634887695312, 0.09358978271484375, 0.10595321655273438, 0.118316650390625, 0.13068008422851562, 0.14304351806640625, 0.15540695190429688, 0.1677703857421875, 0.18013381958007812, 0.19249725341796875, 0.20486068725585938, 0.21722412109375, 0.22958755493164062, 0.24195098876953125, 0.2543144226074219, 0.2666778564453125, 0.2790412902832031, 0.29140472412109375, 0.3037681579589844, 0.316131591796875, 0.3284950256347656, 0.34085845947265625, 0.3532218933105469, 0.3655853271484375, 0.3779487609863281, 0.39031219482421875, 0.4026756286621094, 0.4150390625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 5.0, 10.0, 13.0, 18.0, 13.0, 13.0, 24.0, 28.0, 51.0, 32.0, 54.0, 72.0, 55.0, 67.0, 59.0, 61.0, 63.0, 56.0, 54.0, 47.0, 40.0, 29.0, 19.0, 26.0, 12.0, 18.0, 12.0, 6.0, 10.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0017175674438476562, -0.0016696304082870483, -0.0016216933727264404, -0.0015737563371658325, -0.0015258193016052246, -0.0014778822660446167, -0.0014299452304840088, -0.0013820081949234009, -0.001334071159362793, -0.001286134123802185, -0.0012381970882415771, -0.0011902600526809692, -0.0011423230171203613, -0.0010943859815597534, -0.0010464489459991455, -0.0009985119104385376, -0.0009505748748779297, -0.0009026378393173218, -0.0008547008037567139, -0.000806763768196106, -0.000758826732635498, -0.0007108896970748901, -0.0006629526615142822, -0.0006150156259536743, -0.0005670785903930664, -0.0005191415548324585, -0.0004712045192718506, -0.0004232674837112427, -0.00037533044815063477, -0.00032739341259002686, -0.00027945637702941895, -0.00023151934146881104, -0.00018358230590820312, -0.00013564527034759521, -8.77082347869873e-05, -3.9771199226379395e-05, 8.165836334228516e-06, 5.6102871894836426e-05, 0.00010403990745544434, 0.00015197694301605225, 0.00019991397857666016, 0.00024785101413726807, 0.000295788049697876, 0.0003437250852584839, 0.0003916621208190918, 0.0004395991563796997, 0.0004875361919403076, 0.0005354732275009155, 0.0005834102630615234, 0.0006313472986221313, 0.0006792843341827393, 0.0007272213697433472, 0.0007751584053039551, 0.000823095440864563, 0.0008710324764251709, 0.0009189695119857788, 0.0009669065475463867, 0.0010148435831069946, 0.0010627806186676025, 0.0011107176542282104, 0.0011586546897888184, 0.0012065917253494263, 0.0012545287609100342, 0.001302465796470642, 0.00135040283203125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 4.0, 6.0, 13.0, 7.0, 20.0, 25.0, 27.0, 44.0, 55.0, 77.0, 94.0, 135.0, 264.0, 591.0, 1945.0, 909959.0, 133024.0, 1066.0, 441.0, 225.0, 148.0, 86.0, 84.0, 51.0, 42.0, 21.0, 18.0, 15.0, 11.0, 10.0, 11.0, 8.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028564453125, -0.027538299560546875, -0.02651214599609375, -0.025485992431640625, -0.0244598388671875, -0.023433685302734375, -0.02240753173828125, -0.021381378173828125, -0.020355224609375, -0.019329071044921875, -0.01830291748046875, -0.017276763916015625, -0.0162506103515625, -0.015224456787109375, -0.01419830322265625, -0.013172149658203125, -0.01214599609375, -0.011119842529296875, -0.01009368896484375, -0.009067535400390625, -0.0080413818359375, -0.007015228271484375, -0.00598907470703125, -0.004962921142578125, -0.003936767578125, -0.002910614013671875, -0.00188446044921875, -0.000858306884765625, 0.0001678466796875, 0.001194000244140625, 0.00222015380859375, 0.003246307373046875, 0.0042724609375, 0.005298614501953125, 0.00632476806640625, 0.007350921630859375, 0.0083770751953125, 0.009403228759765625, 0.01042938232421875, 0.011455535888671875, 0.012481689453125, 0.013507843017578125, 0.01453399658203125, 0.015560150146484375, 0.0165863037109375, 0.017612457275390625, 0.01863861083984375, 0.019664764404296875, 0.02069091796875, 0.021717071533203125, 0.02274322509765625, 0.023769378662109375, 0.0247955322265625, 0.025821685791015625, 0.02684783935546875, 0.027873992919921875, 0.028900146484375, 0.029926300048828125, 0.03095245361328125, 0.031978607177734375, 0.0330047607421875, 0.034030914306640625, 0.03505706787109375, 0.036083221435546875, 0.037109375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 20.0, 100.0, 345.0, 366.0, 148.0, 27.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005234075710177422, -0.0051317536272108555, -0.005029431078583002, -0.004927108995616436, -0.00482478691264987, -0.0047224643640220165, -0.0046201422810554504, -0.004517819732427597, -0.004415497649461031, -0.004313175566494465, -0.0042108530178666115, -0.004108530934900045, -0.004006208851933479, -0.003903886303305626, -0.00380156422033906, -0.00369924190454185, -0.0035969195887446404, -0.0034945972729474306, -0.0033922751899808645, -0.003289952874183655, -0.003187630558386445, -0.0030853082425892353, -0.0029829861596226692, -0.0028806638438254595, -0.0027783417608588934, -0.0026760194450616837, -0.0025736973620951176, -0.002471375046297908, -0.002369052730500698, -0.002266730647534132, -0.0021644083317369223, -0.0020620860159397125, -0.001959763700142503, -0.0018574415007606149, -0.0017551191849634051, -0.0016527969855815172, -0.0015504746697843075, -0.0014481524704024196, -0.0013458302710205317, -0.001243507955223322, -0.0011411856394261122, -0.0010388634400442243, -0.0009365411242470145, -0.0008342189248651266, -0.0007318966090679169, -0.000629574409686029, -0.0005272521520964801, -0.0004249298945069313, -0.0003226076951250434, -0.00022028543753549457, -0.00011796319449786097, -1.564095146022737e-05, 8.668130612932146e-05, 0.00018900353461503983, 0.00029132579220458865, 0.0003936480497941375, 0.0004959703073836863, 0.0005982925649732351, 0.000700614822562784, 0.0008029370801523328, 0.0009052592795342207, 0.0010075815953314304, 0.0011099037947133183, 0.0012122259940952063, 0.001314548309892416]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 15.0, 15.0, 20.0, 15.0, 17.0, 34.0, 25.0, 31.0, 31.0, 40.0, 40.0, 32.0, 62.0, 41.0, 48.0, 56.0, 52.0, 46.0, 32.0, 43.0, 30.0, 28.0, 43.0, 30.0, 31.0, 20.0, 23.0, 17.0, 14.0, 14.0, 11.0, 10.0, 8.0, 4.0, 7.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006322264671325684, -0.0006057368591427803, -0.0005792472511529922, -0.0005527576431632042, -0.0005262680351734161, -0.0004997784271836281, -0.00047328881919384, -0.00044679921120405197, -0.0004203096032142639, -0.00039381999522447586, -0.0003673303872346878, -0.00034084077924489975, -0.0003143511712551117, -0.00028786156326532364, -0.0002613719552755356, -0.00023488234728574753, -0.00020839273929595947, -0.00018190313130617142, -0.00015541352331638336, -0.0001289239153265953, -0.00010243430733680725, -7.59446993470192e-05, -4.945509135723114e-05, -2.2965483367443085e-05, 3.5241246223449707e-06, 3.0013732612133026e-05, 5.650334060192108e-05, 8.299294859170914e-05, 0.00010948255658149719, 0.00013597216457128525, 0.0001624617725610733, 0.00018895138055086136, 0.00021544098854064941, 0.00024193059653043747, 0.0002684202045202255, 0.0002949098125100136, 0.00032139942049980164, 0.0003478890284895897, 0.00037437863647937775, 0.0004008682444691658, 0.00042735785245895386, 0.0004538474604487419, 0.00048033706843852997, 0.000506826676428318, 0.0005333162844181061, 0.0005598058924078941, 0.0005862955003976822, 0.0006127851083874702, 0.0006392747163772583, 0.0006657643243670464, 0.0006922539323568344, 0.0007187435403466225, 0.0007452331483364105, 0.0007717227563261986, 0.0007982123643159866, 0.0008247019723057747, 0.0008511915802955627, 0.0008776811882853508, 0.0009041707962751389, 0.0009306604042649269, 0.000957150012254715, 0.000983639620244503, 0.001010129228234291, 0.0010366188362240791, 0.0010631084442138672]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 9.0, 9.0, 9.0, 23.0, 20.0, 17.0, 21.0, 25.0, 29.0, 38.0, 41.0, 45.0, 34.0, 31.0, 47.0, 47.0, 34.0, 30.0, 50.0, 48.0, 32.0, 27.0, 32.0, 24.0, 23.0, 21.0, 26.0, 34.0, 24.0, 17.0, 25.0, 9.0, 10.0, 9.0, 8.0, 10.0, 6.0, 3.0, 4.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.5234375, -7.30572509765625, -7.0880126953125, -6.87030029296875, -6.652587890625, -6.43487548828125, -6.2171630859375, -5.99945068359375, -5.78173828125, -5.56402587890625, -5.3463134765625, -5.12860107421875, -4.910888671875, -4.69317626953125, -4.4754638671875, -4.25775146484375, -4.0400390625, -3.82232666015625, -3.6046142578125, -3.38690185546875, -3.169189453125, -2.95147705078125, -2.7337646484375, -2.51605224609375, -2.29833984375, -2.08062744140625, -1.8629150390625, -1.64520263671875, -1.427490234375, -1.20977783203125, -0.9920654296875, -0.77435302734375, -0.556640625, -0.33892822265625, -0.1212158203125, 0.09649658203125, 0.314208984375, 0.53192138671875, 0.7496337890625, 0.96734619140625, 1.18505859375, 1.40277099609375, 1.6204833984375, 1.83819580078125, 2.055908203125, 2.27362060546875, 2.4913330078125, 2.70904541015625, 2.9267578125, 3.14447021484375, 3.3621826171875, 3.57989501953125, 3.797607421875, 4.01531982421875, 4.2330322265625, 4.45074462890625, 4.66845703125, 4.88616943359375, 5.1038818359375, 5.32159423828125, 5.539306640625, 5.75701904296875, 5.9747314453125, 6.19244384765625, 6.41015625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 10.0, 3.0, 5.0, 6.0, 6.0, 6.0, 14.0, 11.0, 14.0, 30.0, 39.0, 74.0, 85.0, 236.0, 402.0, 904.0, 2080.0, 4901.0, 11473.0, 26692.0, 66531.0, 188736.0, 380918.0, 228999.0, 80651.0, 31916.0, 13320.0, 5843.0, 2500.0, 1093.0, 488.0, 235.0, 118.0, 66.0, 35.0, 34.0, 22.0, 15.0, 10.0, 9.0, 9.0, 6.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.9447021484375, -8.678466796875, -8.4122314453125, -8.14599609375, -7.8797607421875, -7.613525390625, -7.3472900390625, -7.0810546875, -6.8148193359375, -6.548583984375, -6.2823486328125, -6.01611328125, -5.7498779296875, -5.483642578125, -5.2174072265625, -4.951171875, -4.6849365234375, -4.418701171875, -4.1524658203125, -3.88623046875, -3.6199951171875, -3.353759765625, -3.0875244140625, -2.8212890625, -2.5550537109375, -2.288818359375, -2.0225830078125, -1.75634765625, -1.4901123046875, -1.223876953125, -0.9576416015625, -0.69140625, -0.4251708984375, -0.158935546875, 0.1072998046875, 0.37353515625, 0.6397705078125, 0.906005859375, 1.1722412109375, 1.4384765625, 1.7047119140625, 1.970947265625, 2.2371826171875, 2.50341796875, 2.7696533203125, 3.035888671875, 3.3021240234375, 3.568359375, 3.8345947265625, 4.100830078125, 4.3670654296875, 4.63330078125, 4.8995361328125, 5.165771484375, 5.4320068359375, 5.6982421875, 5.9644775390625, 6.230712890625, 6.4969482421875, 6.76318359375, 7.0294189453125, 7.295654296875, 7.5618896484375, 7.828125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 2.0, 5.0, 12.0, 8.0, 11.0, 11.0, 8.0, 18.0, 36.0, 22.0, 39.0, 38.0, 49.0, 38.0, 55.0, 58.0, 92.0, 178.0, 1410.0, 345.0, 131.0, 85.0, 89.0, 47.0, 44.0, 24.0, 32.0, 22.0, 27.0, 22.0, 16.0, 16.0, 16.0, 7.0, 12.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.131103515625, -21.27783203125, -20.424560546875, -19.5712890625, -18.718017578125, -17.86474609375, -17.011474609375, -16.158203125, -15.304931640625, -14.45166015625, -13.598388671875, -12.7451171875, -11.891845703125, -11.03857421875, -10.185302734375, -9.33203125, -8.478759765625, -7.62548828125, -6.772216796875, -5.9189453125, -5.065673828125, -4.21240234375, -3.359130859375, -2.505859375, -1.652587890625, -0.79931640625, 0.053955078125, 0.9072265625, 1.760498046875, 2.61376953125, 3.467041015625, 4.3203125, 5.173583984375, 6.02685546875, 6.880126953125, 7.7333984375, 8.586669921875, 9.43994140625, 10.293212890625, 11.146484375, 11.999755859375, 12.85302734375, 13.706298828125, 14.5595703125, 15.412841796875, 16.26611328125, 17.119384765625, 17.97265625, 18.825927734375, 19.67919921875, 20.532470703125, 21.3857421875, 22.239013671875, 23.09228515625, 23.945556640625, 24.798828125, 25.652099609375, 26.50537109375, 27.358642578125, 28.2119140625, 29.065185546875, 29.91845703125, 30.771728515625, 31.625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 8.0, 17.0, 27.0, 36.0, 55.0, 73.0, 113.0, 181.0, 277.0, 560.0, 1531.0, 47292.0, 3074774.0, 18222.0, 1175.0, 514.0, 309.0, 167.0, 113.0, 68.0, 36.0, 32.0, 23.0, 17.0, 17.0, 15.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.3125, -58.1123046875, -55.912109375, -53.7119140625, -51.51171875, -49.3115234375, -47.111328125, -44.9111328125, -42.7109375, -40.5107421875, -38.310546875, -36.1103515625, -33.91015625, -31.7099609375, -29.509765625, -27.3095703125, -25.109375, -22.9091796875, -20.708984375, -18.5087890625, -16.30859375, -14.1083984375, -11.908203125, -9.7080078125, -7.5078125, -5.3076171875, -3.107421875, -0.9072265625, 1.29296875, 3.4931640625, 5.693359375, 7.8935546875, 10.09375, 12.2939453125, 14.494140625, 16.6943359375, 18.89453125, 21.0947265625, 23.294921875, 25.4951171875, 27.6953125, 29.8955078125, 32.095703125, 34.2958984375, 36.49609375, 38.6962890625, 40.896484375, 43.0966796875, 45.296875, 47.4970703125, 49.697265625, 51.8974609375, 54.09765625, 56.2978515625, 58.498046875, 60.6982421875, 62.8984375, 65.0986328125, 67.298828125, 69.4990234375, 71.69921875, 73.8994140625, 76.099609375, 78.2998046875, 80.5]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 34.0, 66.0, 139.0, 200.0, 207.0, 165.0, 94.0, 72.0, 21.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15580940246582, -18.501420974731445, -16.84703254699707, -15.192644119262695, -13.53825569152832, -11.883867263793945, -10.22947883605957, -8.575090408325195, -6.92070198059082, -5.266313552856445, -3.6119251251220703, -1.9575366973876953, -0.3031482696533203, 1.3512401580810547, 3.0056285858154297, 4.660017013549805, 6.31440544128418, 7.968793869018555, 9.62318229675293, 11.277570724487305, 12.93195915222168, 14.586347579956055, 16.24073600769043, 17.895124435424805, 19.54951286315918, 21.203901290893555, 22.85828971862793, 24.512678146362305, 26.16706657409668, 27.821455001831055, 29.47584342956543, 31.130231857299805, 32.78462219238281, 34.43901062011719, 36.09339904785156, 37.74778747558594, 39.40217590332031, 41.05656433105469, 42.71095275878906, 44.36534118652344, 46.01972961425781, 47.67411804199219, 49.32850646972656, 50.98289489746094, 52.63728332519531, 54.29167175292969, 55.94606018066406, 57.60044860839844, 59.25483703613281, 60.90922546386719, 62.56361389160156, 64.21800231933594, 65.87239074707031, 67.52677917480469, 69.18116760253906, 70.83555603027344, 72.48994445800781, 74.14433288574219, 75.79872131347656, 77.45310974121094, 79.10749816894531, 80.76188659667969, 82.41627502441406, 84.07066345214844, 85.72505187988281]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 10.0, 5.0, 7.0, 20.0, 26.0, 8.0, 15.0, 27.0, 24.0, 28.0, 41.0, 35.0, 35.0, 42.0, 38.0, 45.0, 43.0, 42.0, 38.0, 36.0, 40.0, 56.0, 36.0, 34.0, 37.0, 35.0, 26.0, 24.0, 30.0, 10.0, 17.0, 13.0, 13.0, 11.0, 13.0, 9.0, 5.0, 6.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-54.48859786987305, -52.599021911621094, -50.70944595336914, -48.81986999511719, -46.93029022216797, -45.04071807861328, -43.15113830566406, -41.26156234741211, -39.371986389160156, -37.4824104309082, -35.59283447265625, -33.7032585144043, -31.81368064880371, -29.924104690551758, -28.034526824951172, -26.14495086669922, -24.255374908447266, -22.365798950195312, -20.47622299194336, -18.586645126342773, -16.69706916809082, -14.807493209838867, -12.917916297912598, -11.028339385986328, -9.138763427734375, -7.249186992645264, -5.359610557556152, -3.470034122467041, -1.5804576873779297, 0.30911827087402344, 2.198695182800293, 4.0882720947265625, 5.97784423828125, 7.867420673370361, 9.756997108459473, 11.646574020385742, 13.536149978637695, 15.425725936889648, 17.315303802490234, 19.204879760742188, 21.09445571899414, 22.984031677246094, 24.873607635498047, 26.763185501098633, 28.652761459350586, 30.54233741760254, 32.431915283203125, 34.32149124145508, 36.21106719970703, 38.100643157958984, 39.99021911621094, 41.87979507446289, 43.769371032714844, 45.65895080566406, 47.548526763916016, 49.43810272216797, 51.32767868041992, 53.217254638671875, 55.10683059692383, 56.99640655517578, 58.885986328125, 60.77555847167969, 62.665138244628906, 64.55471801757812, 66.44429016113281]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 1.0, 4.0, 4.0, 7.0, 2.0, 7.0, 4.0, 6.0, 15.0, 12.0, 14.0, 18.0, 9.0, 19.0, 17.0, 21.0, 29.0, 35.0, 26.0, 33.0, 32.0, 47.0, 39.0, 38.0, 45.0, 38.0, 44.0, 29.0, 38.0, 42.0, 37.0, 21.0, 32.0, 24.0, 30.0, 30.0, 17.0, 18.0, 16.0, 16.0, 15.0, 14.0, 11.0, 10.0, 8.0, 7.0, 8.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.6640625, -7.4420166015625, -7.219970703125, -6.9979248046875, -6.77587890625, -6.5538330078125, -6.331787109375, -6.1097412109375, -5.8876953125, -5.6656494140625, -5.443603515625, -5.2215576171875, -4.99951171875, -4.7774658203125, -4.555419921875, -4.3333740234375, -4.111328125, -3.8892822265625, -3.667236328125, -3.4451904296875, -3.22314453125, -3.0010986328125, -2.779052734375, -2.5570068359375, -2.3349609375, -2.1129150390625, -1.890869140625, -1.6688232421875, -1.44677734375, -1.2247314453125, -1.002685546875, -0.7806396484375, -0.55859375, -0.3365478515625, -0.114501953125, 0.1075439453125, 0.32958984375, 0.5516357421875, 0.773681640625, 0.9957275390625, 1.2177734375, 1.4398193359375, 1.661865234375, 1.8839111328125, 2.10595703125, 2.3280029296875, 2.550048828125, 2.7720947265625, 2.994140625, 3.2161865234375, 3.438232421875, 3.6602783203125, 3.88232421875, 4.1043701171875, 4.326416015625, 4.5484619140625, 4.7705078125, 4.9925537109375, 5.214599609375, 5.4366455078125, 5.65869140625, 5.8807373046875, 6.102783203125, 6.3248291015625, 6.546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 4.0, 5.0, 9.0, 8.0, 7.0, 23.0, 18.0, 25.0, 22.0, 26.0, 36.0, 42.0, 70.0, 70.0, 124.0, 165.0, 501.0, 2334.0, 26609.0, 491150.0, 2798075.0, 821885.0, 48049.0, 3639.0, 629.0, 208.0, 119.0, 71.0, 60.0, 47.0, 45.0, 38.0, 22.0, 17.0, 20.0, 11.0, 15.0, 10.0, 16.0, 10.0, 7.0, 9.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.1875, -19.60400390625, -19.0205078125, -18.43701171875, -17.853515625, -17.27001953125, -16.6865234375, -16.10302734375, -15.51953125, -14.93603515625, -14.3525390625, -13.76904296875, -13.185546875, -12.60205078125, -12.0185546875, -11.43505859375, -10.8515625, -10.26806640625, -9.6845703125, -9.10107421875, -8.517578125, -7.93408203125, -7.3505859375, -6.76708984375, -6.18359375, -5.60009765625, -5.0166015625, -4.43310546875, -3.849609375, -3.26611328125, -2.6826171875, -2.09912109375, -1.515625, -0.93212890625, -0.3486328125, 0.23486328125, 0.818359375, 1.40185546875, 1.9853515625, 2.56884765625, 3.15234375, 3.73583984375, 4.3193359375, 4.90283203125, 5.486328125, 6.06982421875, 6.6533203125, 7.23681640625, 7.8203125, 8.40380859375, 8.9873046875, 9.57080078125, 10.154296875, 10.73779296875, 11.3212890625, 11.90478515625, 12.48828125, 13.07177734375, 13.6552734375, 14.23876953125, 14.822265625, 15.40576171875, 15.9892578125, 16.57275390625, 17.15625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 16.0, 14.0, 16.0, 12.0, 31.0, 44.0, 59.0, 77.0, 84.0, 121.0, 207.0, 240.0, 357.0, 413.0, 423.0, 432.0, 398.0, 279.0, 218.0, 174.0, 118.0, 93.0, 48.0, 41.0, 44.0, 33.0, 25.0, 10.0, 9.0, 8.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.734375, -12.334716796875, -11.93505859375, -11.535400390625, -11.1357421875, -10.736083984375, -10.33642578125, -9.936767578125, -9.537109375, -9.137451171875, -8.73779296875, -8.338134765625, -7.9384765625, -7.538818359375, -7.13916015625, -6.739501953125, -6.33984375, -5.940185546875, -5.54052734375, -5.140869140625, -4.7412109375, -4.341552734375, -3.94189453125, -3.542236328125, -3.142578125, -2.742919921875, -2.34326171875, -1.943603515625, -1.5439453125, -1.144287109375, -0.74462890625, -0.344970703125, 0.0546875, 0.454345703125, 0.85400390625, 1.253662109375, 1.6533203125, 2.052978515625, 2.45263671875, 2.852294921875, 3.251953125, 3.651611328125, 4.05126953125, 4.450927734375, 4.8505859375, 5.250244140625, 5.64990234375, 6.049560546875, 6.44921875, 6.848876953125, 7.24853515625, 7.648193359375, 8.0478515625, 8.447509765625, 8.84716796875, 9.246826171875, 9.646484375, 10.046142578125, 10.44580078125, 10.845458984375, 11.2451171875, 11.644775390625, 12.04443359375, 12.444091796875, 12.84375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 5.0, 16.0, 10.0, 28.0, 34.0, 35.0, 59.0, 84.0, 115.0, 139.0, 216.0, 340.0, 586.0, 1554.0, 23994.0, 1886895.0, 2248074.0, 28478.0, 1857.0, 564.0, 389.0, 232.0, 143.0, 122.0, 90.0, 68.0, 41.0, 23.0, 29.0, 15.0, 13.0, 13.0, 4.0, 4.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.1875, -40.8701171875, -39.552734375, -38.2353515625, -36.91796875, -35.6005859375, -34.283203125, -32.9658203125, -31.6484375, -30.3310546875, -29.013671875, -27.6962890625, -26.37890625, -25.0615234375, -23.744140625, -22.4267578125, -21.109375, -19.7919921875, -18.474609375, -17.1572265625, -15.83984375, -14.5224609375, -13.205078125, -11.8876953125, -10.5703125, -9.2529296875, -7.935546875, -6.6181640625, -5.30078125, -3.9833984375, -2.666015625, -1.3486328125, -0.03125, 1.2861328125, 2.603515625, 3.9208984375, 5.23828125, 6.5556640625, 7.873046875, 9.1904296875, 10.5078125, 11.8251953125, 13.142578125, 14.4599609375, 15.77734375, 17.0947265625, 18.412109375, 19.7294921875, 21.046875, 22.3642578125, 23.681640625, 24.9990234375, 26.31640625, 27.6337890625, 28.951171875, 30.2685546875, 31.5859375, 32.9033203125, 34.220703125, 35.5380859375, 36.85546875, 38.1728515625, 39.490234375, 40.8076171875, 42.125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [4.0, 44.0, 311.0, 473.0, 172.0, 13.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.403104782104492, -17.038330078125, -9.673555374145508, -2.3087806701660156, 5.055994033813477, 12.420770645141602, 19.78554344177246, 27.15031623840332, 34.51509094238281, 41.87986755371094, 49.2446403503418, 56.609413146972656, 63.97418975830078, 71.3389663696289, 78.7037353515625, 86.06851196289062, 93.43328857421875, 100.79806518554688, 108.162841796875, 115.5276107788086, 122.89238739013672, 130.25717163085938, 137.62193298339844, 144.98670959472656, 152.3514862060547, 159.7162628173828, 167.08103942871094, 174.44581604003906, 181.81057739257812, 189.17535400390625, 196.54013061523438, 203.9049072265625, 211.26968383789062, 218.63446044921875, 225.99923706054688, 233.364013671875, 240.72879028320312, 248.09356689453125, 255.4583282470703, 262.8231201171875, 270.1878662109375, 277.5526428222656, 284.91741943359375, 292.2821960449219, 299.64697265625, 307.0117492675781, 314.37652587890625, 321.74127197265625, 329.1060791015625, 336.4708557128906, 343.83563232421875, 351.2004089355469, 358.565185546875, 365.9299621582031, 373.29473876953125, 380.65948486328125, 388.0242919921875, 395.3890686035156, 402.75384521484375, 410.1186218261719, 417.4833984375, 424.8481750488281, 432.21295166015625, 439.57769775390625, 446.9424743652344]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 7.0, 8.0, 9.0, 13.0, 13.0, 21.0, 21.0, 21.0, 22.0, 28.0, 30.0, 43.0, 45.0, 30.0, 40.0, 54.0, 34.0, 51.0, 41.0, 42.0, 41.0, 26.0, 32.0, 42.0, 39.0, 26.0, 41.0, 31.0, 23.0, 15.0, 13.0, 15.0, 19.0, 13.0, 11.0, 7.0, 4.0, 8.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.55632019042969, -40.210723876953125, -38.86512756347656, -37.51953125, -36.17393493652344, -34.828338623046875, -33.48274230957031, -32.137149810791016, -30.791553497314453, -29.44595718383789, -28.100360870361328, -26.754764556884766, -25.409170150756836, -24.063573837280273, -22.71797752380371, -21.37238311767578, -20.026784896850586, -18.681188583374023, -17.33559226989746, -15.989996910095215, -14.644401550292969, -13.298805236816406, -11.953208923339844, -10.607613563537598, -9.262017250061035, -7.916421413421631, -6.570825576782227, -5.225229263305664, -3.8796334266662598, -2.5340375900268555, -1.188441276550293, 0.15715408325195312, 1.5027503967285156, 2.84834623336792, 4.193942070007324, 5.539538383483887, 6.885134220123291, 8.230730056762695, 9.576326370239258, 10.921921730041504, 12.267518043518066, 13.613114356994629, 14.958709716796875, 16.304306030273438, 17.64990234375, 18.995498657226562, 20.341094970703125, 21.686689376831055, 23.032285690307617, 24.37788200378418, 25.723478317260742, 27.069072723388672, 28.414669036865234, 29.760265350341797, 31.10586166381836, 32.45145797729492, 33.797054290771484, 35.14265060424805, 36.48824691772461, 37.83384323120117, 39.179439544677734, 40.52503204345703, 41.870628356933594, 43.216224670410156, 44.56182098388672]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 7.0, 13.0, 6.0, 14.0, 14.0, 12.0, 14.0, 22.0, 19.0, 25.0, 36.0, 31.0, 32.0, 39.0, 35.0, 30.0, 32.0, 36.0, 42.0, 29.0, 42.0, 43.0, 37.0, 39.0, 35.0, 36.0, 35.0, 24.0, 28.0, 27.0, 21.0, 15.0, 23.0, 14.0, 15.0, 10.0, 9.0, 5.0, 5.0, 12.0, 14.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.10546875, -6.88580322265625, -6.6661376953125, -6.44647216796875, -6.226806640625, -6.00714111328125, -5.7874755859375, -5.56781005859375, -5.34814453125, -5.12847900390625, -4.9088134765625, -4.68914794921875, -4.469482421875, -4.24981689453125, -4.0301513671875, -3.81048583984375, -3.5908203125, -3.37115478515625, -3.1514892578125, -2.93182373046875, -2.712158203125, -2.49249267578125, -2.2728271484375, -2.05316162109375, -1.83349609375, -1.61383056640625, -1.3941650390625, -1.17449951171875, -0.954833984375, -0.73516845703125, -0.5155029296875, -0.29583740234375, -0.076171875, 0.14349365234375, 0.3631591796875, 0.58282470703125, 0.802490234375, 1.02215576171875, 1.2418212890625, 1.46148681640625, 1.68115234375, 1.90081787109375, 2.1204833984375, 2.34014892578125, 2.559814453125, 2.77947998046875, 2.9991455078125, 3.21881103515625, 3.4384765625, 3.65814208984375, 3.8778076171875, 4.09747314453125, 4.317138671875, 4.53680419921875, 4.7564697265625, 4.97613525390625, 5.19580078125, 5.41546630859375, 5.6351318359375, 5.85479736328125, 6.074462890625, 6.29412841796875, 6.5137939453125, 6.73345947265625, 6.953125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 10.0, 8.0, 7.0, 18.0, 23.0, 52.0, 67.0, 97.0, 126.0, 201.0, 254.0, 413.0, 655.0, 925.0, 1310.0, 1958.0, 2895.0, 4426.0, 6730.0, 10317.0, 16351.0, 25792.0, 41047.0, 67624.0, 108619.0, 166660.0, 195391.0, 146904.0, 93714.0, 57747.0, 35526.0, 22121.0, 14065.0, 8879.0, 5860.0, 3892.0, 2543.0, 1745.0, 1153.0, 805.0, 500.0, 367.0, 231.0, 165.0, 127.0, 72.0, 56.0, 42.0, 24.0, 16.0, 14.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.5439453125, -0.5265884399414062, -0.5092315673828125, -0.49187469482421875, -0.474517822265625, -0.45716094970703125, -0.4398040771484375, -0.42244720458984375, -0.40509033203125, -0.38773345947265625, -0.3703765869140625, -0.35301971435546875, -0.335662841796875, -0.31830596923828125, -0.3009490966796875, -0.28359222412109375, -0.2662353515625, -0.24887847900390625, -0.2315216064453125, -0.21416473388671875, -0.196807861328125, -0.17945098876953125, -0.1620941162109375, -0.14473724365234375, -0.12738037109375, -0.11002349853515625, -0.0926666259765625, -0.07530975341796875, -0.057952880859375, -0.04059600830078125, -0.0232391357421875, -0.00588226318359375, 0.011474609375, 0.02883148193359375, 0.0461883544921875, 0.06354522705078125, 0.080902099609375, 0.09825897216796875, 0.1156158447265625, 0.13297271728515625, 0.15032958984375, 0.16768646240234375, 0.1850433349609375, 0.20240020751953125, 0.219757080078125, 0.23711395263671875, 0.2544708251953125, 0.27182769775390625, 0.2891845703125, 0.30654144287109375, 0.3238983154296875, 0.34125518798828125, 0.358612060546875, 0.37596893310546875, 0.3933258056640625, 0.41068267822265625, 0.42803955078125, 0.44539642333984375, 0.4627532958984375, 0.48011016845703125, 0.497467041015625, 0.5148239135742188, 0.5321807861328125, 0.5495376586914062, 0.56689453125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 4.0, 5.0, 12.0, 10.0, 13.0, 9.0, 15.0, 13.0, 25.0, 19.0, 26.0, 22.0, 25.0, 38.0, 33.0, 48.0, 28.0, 31.0, 46.0, 42.0, 55.0, 1068.0, 44.0, 41.0, 37.0, 42.0, 30.0, 33.0, 26.0, 24.0, 20.0, 27.0, 25.0, 15.0, 13.0, 10.0, 7.0, 9.0, 9.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0], "bins": [-5.44140625, -5.2904052734375, -5.139404296875, -4.9884033203125, -4.83740234375, -4.6864013671875, -4.535400390625, -4.3843994140625, -4.2333984375, -4.0823974609375, -3.931396484375, -3.7803955078125, -3.62939453125, -3.4783935546875, -3.327392578125, -3.1763916015625, -3.025390625, -2.8743896484375, -2.723388671875, -2.5723876953125, -2.42138671875, -2.2703857421875, -2.119384765625, -1.9683837890625, -1.8173828125, -1.6663818359375, -1.515380859375, -1.3643798828125, -1.21337890625, -1.0623779296875, -0.911376953125, -0.7603759765625, -0.609375, -0.4583740234375, -0.307373046875, -0.1563720703125, -0.00537109375, 0.1456298828125, 0.296630859375, 0.4476318359375, 0.5986328125, 0.7496337890625, 0.900634765625, 1.0516357421875, 1.20263671875, 1.3536376953125, 1.504638671875, 1.6556396484375, 1.806640625, 1.9576416015625, 2.108642578125, 2.2596435546875, 2.41064453125, 2.5616455078125, 2.712646484375, 2.8636474609375, 3.0146484375, 3.1656494140625, 3.316650390625, 3.4676513671875, 3.61865234375, 3.7696533203125, 3.920654296875, 4.0716552734375, 4.22265625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 6.0, 4.0, 20.0, 25.0, 44.0, 44.0, 98.0, 139.0, 245.0, 381.0, 661.0, 1042.0, 1657.0, 2786.0, 4407.0, 7318.0, 11551.0, 18437.0, 30564.0, 50245.0, 83272.0, 134693.0, 1226085.0, 198172.0, 126636.0, 77621.0, 46589.0, 28461.0, 17432.0, 10779.0, 6777.0, 4170.0, 2568.0, 1611.0, 1052.0, 601.0, 383.0, 219.0, 107.0, 90.0, 56.0, 33.0, 26.0, 15.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5361328125, -0.5198516845703125, -0.503570556640625, -0.4872894287109375, -0.47100830078125, -0.4547271728515625, -0.438446044921875, -0.4221649169921875, -0.4058837890625, -0.3896026611328125, -0.373321533203125, -0.3570404052734375, -0.34075927734375, -0.3244781494140625, -0.308197021484375, -0.2919158935546875, -0.275634765625, -0.2593536376953125, -0.243072509765625, -0.2267913818359375, -0.21051025390625, -0.1942291259765625, -0.177947998046875, -0.1616668701171875, -0.1453857421875, -0.1291046142578125, -0.112823486328125, -0.0965423583984375, -0.08026123046875, -0.0639801025390625, -0.047698974609375, -0.0314178466796875, -0.01513671875, 0.0011444091796875, 0.017425537109375, 0.0337066650390625, 0.04998779296875, 0.0662689208984375, 0.082550048828125, 0.0988311767578125, 0.1151123046875, 0.1313934326171875, 0.147674560546875, 0.1639556884765625, 0.18023681640625, 0.1965179443359375, 0.212799072265625, 0.2290802001953125, 0.245361328125, 0.2616424560546875, 0.277923583984375, 0.2942047119140625, 0.31048583984375, 0.3267669677734375, 0.343048095703125, 0.3593292236328125, 0.3756103515625, 0.3918914794921875, 0.408172607421875, 0.4244537353515625, 0.44073486328125, 0.4570159912109375, 0.473297119140625, 0.4895782470703125, 0.505859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 17.0, 19.0, 18.0, 28.0, 27.0, 32.0, 56.0, 75.0, 78.0, 93.0, 89.0, 87.0, 78.0, 80.0, 58.0, 34.0, 33.0, 20.0, 23.0, 13.0, 10.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002216339111328125, -0.002132326364517212, -0.002048313617706299, -0.0019643008708953857, -0.0018802881240844727, -0.0017962753772735596, -0.0017122626304626465, -0.0016282498836517334, -0.0015442371368408203, -0.0014602243900299072, -0.0013762116432189941, -0.001292198896408081, -0.001208186149597168, -0.0011241734027862549, -0.0010401606559753418, -0.0009561479091644287, -0.0008721351623535156, -0.0007881224155426025, -0.0007041096687316895, -0.0006200969219207764, -0.0005360841751098633, -0.0004520714282989502, -0.0003680586814880371, -0.000284045934677124, -0.00020003318786621094, -0.00011602044105529785, -3.2007694244384766e-05, 5.200505256652832e-05, 0.0001360177993774414, 0.0002200305461883545, 0.0003040432929992676, 0.00038805603981018066, 0.00047206878662109375, 0.0005560815334320068, 0.0006400942802429199, 0.000724107027053833, 0.0008081197738647461, 0.0008921325206756592, 0.0009761452674865723, 0.0010601580142974854, 0.0011441707611083984, 0.0012281835079193115, 0.0013121962547302246, 0.0013962090015411377, 0.0014802217483520508, 0.0015642344951629639, 0.001648247241973877, 0.00173225998878479, 0.0018162727355957031, 0.0019002854824066162, 0.0019842982292175293, 0.0020683109760284424, 0.0021523237228393555, 0.0022363364696502686, 0.0023203492164611816, 0.0024043619632720947, 0.002488374710083008, 0.002572387456893921, 0.002656400203704834, 0.002740412950515747, 0.00282442569732666, 0.0029084384441375732, 0.0029924511909484863, 0.0030764639377593994, 0.0031604766845703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 15.0, 15.0, 15.0, 37.0, 41.0, 62.0, 95.0, 148.0, 248.0, 556.0, 2601.0, 1040640.0, 2823.0, 572.0, 238.0, 147.0, 66.0, 62.0, 50.0, 44.0, 23.0, 15.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0648193359375, -0.06309127807617188, -0.06136322021484375, -0.059635162353515625, -0.0579071044921875, -0.056179046630859375, -0.05445098876953125, -0.052722930908203125, -0.050994873046875, -0.049266815185546875, -0.04753875732421875, -0.045810699462890625, -0.0440826416015625, -0.042354583740234375, -0.04062652587890625, -0.038898468017578125, -0.03717041015625, -0.035442352294921875, -0.03371429443359375, -0.031986236572265625, -0.0302581787109375, -0.028530120849609375, -0.02680206298828125, -0.025074005126953125, -0.023345947265625, -0.021617889404296875, -0.01988983154296875, -0.018161773681640625, -0.0164337158203125, -0.014705657958984375, -0.01297760009765625, -0.011249542236328125, -0.009521484375, -0.007793426513671875, -0.00606536865234375, -0.004337310791015625, -0.0026092529296875, -0.000881195068359375, 0.00084686279296875, 0.002574920654296875, 0.004302978515625, 0.006031036376953125, 0.00775909423828125, 0.009487152099609375, 0.0112152099609375, 0.012943267822265625, 0.01467132568359375, 0.016399383544921875, 0.01812744140625, 0.019855499267578125, 0.02158355712890625, 0.023311614990234375, 0.0250396728515625, 0.026767730712890625, 0.02849578857421875, 0.030223846435546875, 0.031951904296875, 0.033679962158203125, 0.03540802001953125, 0.037136077880859375, 0.0388641357421875, 0.040592193603515625, 0.04232025146484375, 0.044048309326171875, 0.0457763671875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 18.0, 159.0, 428.0, 350.0, 48.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007464042864739895, -0.0006164053920656443, -0.00048640643944963813, -0.00035640751593746245, -0.00022640859242528677, -9.640969801694155e-05, 3.358925459906459e-05, 0.00016358820721507072, 0.00029358710162341595, 0.0004235860251355916, 0.0005535849486477673, 0.0006835839012637734, 0.0008135827956721187, 0.0009435816900804639, 0.001073580700904131, 0.0012035795953124762, 0.0013335784897208214, 0.0014635773841291666, 0.0015935762785375118, 0.0017235752893611789, 0.001853574183769524, 0.001983573194593191, 0.0021135720890015364, 0.0022435709834098816, 0.002373569877818227, 0.002503568772226572, 0.0026335676666349173, 0.0027635665610432625, 0.0028935656882822514, 0.003023564349859953, 0.003153563477098942, 0.003283562371507287, 0.0034135612659156322, 0.0035435601603239775, 0.0036735590547323227, 0.003803557949140668, 0.003933556843549013, 0.004063555970788002, 0.004193554632365704, 0.0043235537596046925, 0.004453552886843681, 0.00458355201408267, 0.004713550675660372, 0.004843549802899361, 0.004973548464477062, 0.005103547591716051, 0.005233546253293753, 0.0053635453805327415, 0.005493544042110443, 0.005623543169349432, 0.0057535418309271336, 0.0058835409581661224, 0.006013539619743824, 0.006143538746982813, 0.0062735374085605145, 0.006403536535799503, 0.006533535197377205, 0.006663534324616194, 0.006793532986193895, 0.006923532113432884, 0.007053530775010586, 0.007183529902249575, 0.007313528563827276, 0.007443527691066265, 0.007573526818305254]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 5.0, 12.0, 9.0, 9.0, 7.0, 16.0, 16.0, 29.0, 18.0, 22.0, 26.0, 34.0, 28.0, 23.0, 38.0, 36.0, 43.0, 43.0, 42.0, 40.0, 35.0, 44.0, 41.0, 30.0, 41.0, 29.0, 33.0, 37.0, 28.0, 35.0, 25.0, 16.0, 16.0, 18.0, 10.0, 16.0, 11.0, 5.0, 9.0, 7.0, 9.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009061694145202637, -0.0008759219199419022, -0.0008456744253635406, -0.0008154269307851791, -0.0007851794362068176, -0.0007549319416284561, -0.0007246844470500946, -0.0006944369524717331, -0.0006641894578933716, -0.0006339419633150101, -0.0006036944687366486, -0.000573446974158287, -0.0005431994795799255, -0.000512951985001564, -0.0004827044904232025, -0.000452456995844841, -0.0004222095012664795, -0.000391962006688118, -0.00036171451210975647, -0.00033146701753139496, -0.00030121952295303345, -0.00027097202837467194, -0.00024072453379631042, -0.00021047703921794891, -0.0001802295446395874, -0.0001499820500612259, -0.00011973455548286438, -8.948706090450287e-05, -5.923956632614136e-05, -2.8992071747779846e-05, 1.255422830581665e-06, 3.1502917408943176e-05, 6.175041198730469e-05, 9.19979065656662e-05, 0.0001222454011440277, 0.00015249289572238922, 0.00018274039030075073, 0.00021298788487911224, 0.00024323537945747375, 0.00027348287403583527, 0.0003037303686141968, 0.0003339778631925583, 0.0003642253577709198, 0.0003944728523492813, 0.0004247203469276428, 0.00045496784150600433, 0.00048521533608436584, 0.0005154628306627274, 0.0005457103252410889, 0.0005759578198194504, 0.0006062053143978119, 0.0006364528089761734, 0.0006667003035545349, 0.0006969477981328964, 0.0007271952927112579, 0.0007574427872896194, 0.000787690281867981, 0.0008179377764463425, 0.000848185271024704, 0.0008784327656030655, 0.000908680260181427, 0.0009389277547597885, 0.00096917524933815, 0.0009994227439165115, 0.001029670238494873]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 7.0, 13.0, 6.0, 14.0, 14.0, 12.0, 14.0, 22.0, 19.0, 25.0, 36.0, 30.0, 33.0, 39.0, 35.0, 30.0, 32.0, 37.0, 41.0, 29.0, 42.0, 43.0, 37.0, 39.0, 35.0, 36.0, 35.0, 24.0, 28.0, 27.0, 21.0, 15.0, 23.0, 14.0, 15.0, 10.0, 9.0, 5.0, 5.0, 12.0, 14.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.10546875, -6.88580322265625, -6.6661376953125, -6.44647216796875, -6.226806640625, -6.00714111328125, -5.7874755859375, -5.56781005859375, -5.34814453125, -5.12847900390625, -4.9088134765625, -4.68914794921875, -4.469482421875, -4.24981689453125, -4.0301513671875, -3.81048583984375, -3.5908203125, -3.37115478515625, -3.1514892578125, -2.93182373046875, -2.712158203125, -2.49249267578125, -2.2728271484375, -2.05316162109375, -1.83349609375, -1.61383056640625, -1.3941650390625, -1.17449951171875, -0.954833984375, -0.73516845703125, -0.5155029296875, -0.29583740234375, -0.076171875, 0.14349365234375, 0.3631591796875, 0.58282470703125, 0.802490234375, 1.02215576171875, 1.2418212890625, 1.46148681640625, 1.68115234375, 1.90081787109375, 2.1204833984375, 2.34014892578125, 2.559814453125, 2.77947998046875, 2.9991455078125, 3.21881103515625, 3.4384765625, 3.65814208984375, 3.8778076171875, 4.09747314453125, 4.317138671875, 4.53680419921875, 4.7564697265625, 4.97613525390625, 5.19580078125, 5.41546630859375, 5.6351318359375, 5.85479736328125, 6.074462890625, 6.29412841796875, 6.5137939453125, 6.73345947265625, 6.953125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 4.0, 8.0, 14.0, 16.0, 19.0, 26.0, 38.0, 45.0, 58.0, 54.0, 99.0, 107.0, 137.0, 228.0, 376.0, 769.0, 2184.0, 7234.0, 25169.0, 105291.0, 489146.0, 326764.0, 65662.0, 16896.0, 4921.0, 1544.0, 583.0, 335.0, 209.0, 139.0, 98.0, 89.0, 61.0, 46.0, 42.0, 30.0, 20.0, 21.0, 19.0, 11.0, 10.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.421875, -12.0191650390625, -11.616455078125, -11.2137451171875, -10.81103515625, -10.4083251953125, -10.005615234375, -9.6029052734375, -9.2001953125, -8.7974853515625, -8.394775390625, -7.9920654296875, -7.58935546875, -7.1866455078125, -6.783935546875, -6.3812255859375, -5.978515625, -5.5758056640625, -5.173095703125, -4.7703857421875, -4.36767578125, -3.9649658203125, -3.562255859375, -3.1595458984375, -2.7568359375, -2.3541259765625, -1.951416015625, -1.5487060546875, -1.14599609375, -0.7432861328125, -0.340576171875, 0.0621337890625, 0.46484375, 0.8675537109375, 1.270263671875, 1.6729736328125, 2.07568359375, 2.4783935546875, 2.881103515625, 3.2838134765625, 3.6865234375, 4.0892333984375, 4.491943359375, 4.8946533203125, 5.29736328125, 5.7000732421875, 6.102783203125, 6.5054931640625, 6.908203125, 7.3109130859375, 7.713623046875, 8.1163330078125, 8.51904296875, 8.9217529296875, 9.324462890625, 9.7271728515625, 10.1298828125, 10.5325927734375, 10.935302734375, 11.3380126953125, 11.74072265625, 12.1434326171875, 12.546142578125, 12.9488525390625, 13.3515625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 8.0, 3.0, 2.0, 7.0, 5.0, 8.0, 7.0, 11.0, 14.0, 19.0, 21.0, 22.0, 16.0, 25.0, 34.0, 21.0, 28.0, 35.0, 48.0, 49.0, 70.0, 97.0, 254.0, 1449.0, 242.0, 114.0, 51.0, 52.0, 47.0, 35.0, 33.0, 30.0, 20.0, 25.0, 28.0, 23.0, 12.0, 21.0, 16.0, 11.0, 9.0, 8.0, 4.0, 4.0, 9.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-23.78125, -23.072998046875, -22.36474609375, -21.656494140625, -20.9482421875, -20.239990234375, -19.53173828125, -18.823486328125, -18.115234375, -17.406982421875, -16.69873046875, -15.990478515625, -15.2822265625, -14.573974609375, -13.86572265625, -13.157470703125, -12.44921875, -11.740966796875, -11.03271484375, -10.324462890625, -9.6162109375, -8.907958984375, -8.19970703125, -7.491455078125, -6.783203125, -6.074951171875, -5.36669921875, -4.658447265625, -3.9501953125, -3.241943359375, -2.53369140625, -1.825439453125, -1.1171875, -0.408935546875, 0.29931640625, 1.007568359375, 1.7158203125, 2.424072265625, 3.13232421875, 3.840576171875, 4.548828125, 5.257080078125, 5.96533203125, 6.673583984375, 7.3818359375, 8.090087890625, 8.79833984375, 9.506591796875, 10.21484375, 10.923095703125, 11.63134765625, 12.339599609375, 13.0478515625, 13.756103515625, 14.46435546875, 15.172607421875, 15.880859375, 16.589111328125, 17.29736328125, 18.005615234375, 18.7138671875, 19.422119140625, 20.13037109375, 20.838623046875, 21.546875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 7.0, 8.0, 12.0, 16.0, 15.0, 26.0, 24.0, 51.0, 51.0, 62.0, 89.0, 105.0, 173.0, 361.0, 762.0, 3685.0, 909502.0, 2223871.0, 4937.0, 873.0, 376.0, 188.0, 119.0, 101.0, 63.0, 47.0, 39.0, 44.0, 20.0, 19.0, 12.0, 8.0, 11.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.625, -59.57421875, -57.5234375, -55.47265625, -53.421875, -51.37109375, -49.3203125, -47.26953125, -45.21875, -43.16796875, -41.1171875, -39.06640625, -37.015625, -34.96484375, -32.9140625, -30.86328125, -28.8125, -26.76171875, -24.7109375, -22.66015625, -20.609375, -18.55859375, -16.5078125, -14.45703125, -12.40625, -10.35546875, -8.3046875, -6.25390625, -4.203125, -2.15234375, -0.1015625, 1.94921875, 4.0, 6.05078125, 8.1015625, 10.15234375, 12.203125, 14.25390625, 16.3046875, 18.35546875, 20.40625, 22.45703125, 24.5078125, 26.55859375, 28.609375, 30.66015625, 32.7109375, 34.76171875, 36.8125, 38.86328125, 40.9140625, 42.96484375, 45.015625, 47.06640625, 49.1171875, 51.16796875, 53.21875, 55.26953125, 57.3203125, 59.37109375, 61.421875, 63.47265625, 65.5234375, 67.57421875, 69.625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 11.0, 18.0, 57.0, 76.0, 121.0, 137.0, 157.0, 158.0, 126.0, 75.0, 40.0, 18.0, 15.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.489408493041992, -11.192358016967773, -9.895307540893555, -8.59825611114502, -7.301205635070801, -6.004155158996582, -4.707104206085205, -3.410053253173828, -2.1130027770996094, -0.8159520626068115, 0.48109865188598633, 1.7781493663787842, 3.075200080871582, 4.372250556945801, 5.669301509857178, 6.966352462768555, 8.263402938842773, 9.560453414916992, 10.857503890991211, 12.154555320739746, 13.451605796813965, 14.748656272888184, 16.04570770263672, 17.342758178710938, 18.639808654785156, 19.936859130859375, 21.233909606933594, 22.530960083007812, 23.82801055908203, 25.12506103515625, 26.4221134185791, 27.71916389465332, 29.016212463378906, 30.313262939453125, 31.610313415527344, 32.90736389160156, 34.20441436767578, 35.50146484375, 36.79851531982422, 38.09556579589844, 39.392616271972656, 40.689666748046875, 41.986717224121094, 43.28376770019531, 44.58081817626953, 45.87786865234375, 47.17491912841797, 48.47196960449219, 49.76902389526367, 51.06607437133789, 52.36312484741211, 53.66017532348633, 54.95722579956055, 56.254276275634766, 57.551326751708984, 58.84838104248047, 60.14543151855469, 61.442481994628906, 62.739532470703125, 64.03658294677734, 65.33363342285156, 66.63068389892578, 67.927734375, 69.22478485107422, 70.52183532714844]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 4.0, 8.0, 7.0, 8.0, 12.0, 9.0, 13.0, 15.0, 14.0, 22.0, 21.0, 22.0, 23.0, 29.0, 28.0, 21.0, 28.0, 33.0, 29.0, 41.0, 34.0, 38.0, 43.0, 39.0, 35.0, 48.0, 30.0, 40.0, 34.0, 32.0, 24.0, 32.0, 27.0, 20.0, 17.0, 19.0, 15.0, 12.0, 14.0, 5.0, 4.0, 7.0, 7.0, 12.0, 4.0, 4.0, 1.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-54.7220344543457, -53.028076171875, -51.3341178894043, -49.640159606933594, -47.94620132446289, -46.25224304199219, -44.558284759521484, -42.86432647705078, -41.17036819458008, -39.476409912109375, -37.78245162963867, -36.08849334716797, -34.394535064697266, -32.70057678222656, -31.00661849975586, -29.312660217285156, -27.618703842163086, -25.924745559692383, -24.23078727722168, -22.536828994750977, -20.842870712280273, -19.148914337158203, -17.4549560546875, -15.76099681854248, -14.067038536071777, -12.373080253601074, -10.679121971130371, -8.985164642333984, -7.291205883026123, -5.597248077392578, -3.903289794921875, -2.209331512451172, -0.5153732299804688, 1.1785849332809448, 2.8725430965423584, 4.566501140594482, 6.2604594230651855, 7.9544172286987305, 9.648375511169434, 11.342333793640137, 13.03629207611084, 14.730250358581543, 16.42420768737793, 18.118165969848633, 19.812124252319336, 21.50608253479004, 23.200040817260742, 24.893999099731445, 26.58795738220215, 28.28191566467285, 29.975873947143555, 31.669832229614258, 33.36378860473633, 35.05774688720703, 36.751705169677734, 38.44566345214844, 40.13962173461914, 41.833580017089844, 43.52753829956055, 45.22149658203125, 46.91545486450195, 48.609413146972656, 50.30337142944336, 51.99732971191406, 53.691287994384766]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 10.0, 8.0, 8.0, 9.0, 10.0, 14.0, 11.0, 18.0, 28.0, 25.0, 24.0, 33.0, 44.0, 32.0, 32.0, 40.0, 35.0, 37.0, 31.0, 40.0, 36.0, 49.0, 38.0, 35.0, 33.0, 41.0, 24.0, 38.0, 27.0, 23.0, 25.0, 17.0, 24.0, 18.0, 17.0, 11.0, 10.0, 15.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.46136474609375, -7.2196044921875, -6.97784423828125, -6.736083984375, -6.49432373046875, -6.2525634765625, -6.01080322265625, -5.76904296875, -5.52728271484375, -5.2855224609375, -5.04376220703125, -4.802001953125, -4.56024169921875, -4.3184814453125, -4.07672119140625, -3.8349609375, -3.59320068359375, -3.3514404296875, -3.10968017578125, -2.867919921875, -2.62615966796875, -2.3843994140625, -2.14263916015625, -1.90087890625, -1.65911865234375, -1.4173583984375, -1.17559814453125, -0.933837890625, -0.69207763671875, -0.4503173828125, -0.20855712890625, 0.033203125, 0.27496337890625, 0.5167236328125, 0.75848388671875, 1.000244140625, 1.24200439453125, 1.4837646484375, 1.72552490234375, 1.96728515625, 2.20904541015625, 2.4508056640625, 2.69256591796875, 2.934326171875, 3.17608642578125, 3.4178466796875, 3.65960693359375, 3.9013671875, 4.14312744140625, 4.3848876953125, 4.62664794921875, 4.868408203125, 5.11016845703125, 5.3519287109375, 5.59368896484375, 5.83544921875, 6.07720947265625, 6.3189697265625, 6.56072998046875, 6.802490234375, 7.04425048828125, 7.2860107421875, 7.52777099609375, 7.76953125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 1.0, 6.0, 5.0, 4.0, 12.0, 13.0, 9.0, 20.0, 23.0, 33.0, 44.0, 51.0, 55.0, 104.0, 118.0, 281.0, 1000.0, 5888.0, 59876.0, 779520.0, 2615453.0, 673548.0, 51583.0, 5027.0, 851.0, 245.0, 138.0, 85.0, 51.0, 42.0, 50.0, 23.0, 20.0, 22.0, 18.0, 12.0, 16.0, 10.0, 10.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.125, -16.580810546875, -16.03662109375, -15.492431640625, -14.9482421875, -14.404052734375, -13.85986328125, -13.315673828125, -12.771484375, -12.227294921875, -11.68310546875, -11.138916015625, -10.5947265625, -10.050537109375, -9.50634765625, -8.962158203125, -8.41796875, -7.873779296875, -7.32958984375, -6.785400390625, -6.2412109375, -5.697021484375, -5.15283203125, -4.608642578125, -4.064453125, -3.520263671875, -2.97607421875, -2.431884765625, -1.8876953125, -1.343505859375, -0.79931640625, -0.255126953125, 0.2890625, 0.833251953125, 1.37744140625, 1.921630859375, 2.4658203125, 3.010009765625, 3.55419921875, 4.098388671875, 4.642578125, 5.186767578125, 5.73095703125, 6.275146484375, 6.8193359375, 7.363525390625, 7.90771484375, 8.451904296875, 8.99609375, 9.540283203125, 10.08447265625, 10.628662109375, 11.1728515625, 11.717041015625, 12.26123046875, 12.805419921875, 13.349609375, 13.893798828125, 14.43798828125, 14.982177734375, 15.5263671875, 16.070556640625, 16.61474609375, 17.158935546875, 17.703125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 9.0, 8.0, 12.0, 13.0, 17.0, 22.0, 25.0, 30.0, 42.0, 56.0, 90.0, 122.0, 183.0, 202.0, 302.0, 353.0, 402.0, 386.0, 403.0, 349.0, 253.0, 212.0, 151.0, 109.0, 82.0, 62.0, 45.0, 33.0, 23.0, 12.0, 11.0, 10.0, 10.0, 6.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-14.3515625, -13.9771728515625, -13.602783203125, -13.2283935546875, -12.85400390625, -12.4796142578125, -12.105224609375, -11.7308349609375, -11.3564453125, -10.9820556640625, -10.607666015625, -10.2332763671875, -9.85888671875, -9.4844970703125, -9.110107421875, -8.7357177734375, -8.361328125, -7.9869384765625, -7.612548828125, -7.2381591796875, -6.86376953125, -6.4893798828125, -6.114990234375, -5.7406005859375, -5.3662109375, -4.9918212890625, -4.617431640625, -4.2430419921875, -3.86865234375, -3.4942626953125, -3.119873046875, -2.7454833984375, -2.37109375, -1.9967041015625, -1.622314453125, -1.2479248046875, -0.87353515625, -0.4991455078125, -0.124755859375, 0.2496337890625, 0.6240234375, 0.9984130859375, 1.372802734375, 1.7471923828125, 2.12158203125, 2.4959716796875, 2.870361328125, 3.2447509765625, 3.619140625, 3.9935302734375, 4.367919921875, 4.7423095703125, 5.11669921875, 5.4910888671875, 5.865478515625, 6.2398681640625, 6.6142578125, 6.9886474609375, 7.363037109375, 7.7374267578125, 8.11181640625, 8.4862060546875, 8.860595703125, 9.2349853515625, 9.609375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 11.0, 12.0, 20.0, 32.0, 24.0, 52.0, 51.0, 84.0, 115.0, 162.0, 219.0, 343.0, 566.0, 1360.0, 5952.0, 66461.0, 1757990.0, 2262799.0, 87553.0, 7194.0, 1443.0, 639.0, 354.0, 227.0, 158.0, 112.0, 90.0, 63.0, 47.0, 31.0, 31.0, 18.0, 17.0, 13.0, 8.0, 9.0, 7.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.0625, -26.130859375, -25.19921875, -24.267578125, -23.3359375, -22.404296875, -21.47265625, -20.541015625, -19.609375, -18.677734375, -17.74609375, -16.814453125, -15.8828125, -14.951171875, -14.01953125, -13.087890625, -12.15625, -11.224609375, -10.29296875, -9.361328125, -8.4296875, -7.498046875, -6.56640625, -5.634765625, -4.703125, -3.771484375, -2.83984375, -1.908203125, -0.9765625, -0.044921875, 0.88671875, 1.818359375, 2.75, 3.681640625, 4.61328125, 5.544921875, 6.4765625, 7.408203125, 8.33984375, 9.271484375, 10.203125, 11.134765625, 12.06640625, 12.998046875, 13.9296875, 14.861328125, 15.79296875, 16.724609375, 17.65625, 18.587890625, 19.51953125, 20.451171875, 21.3828125, 22.314453125, 23.24609375, 24.177734375, 25.109375, 26.041015625, 26.97265625, 27.904296875, 28.8359375, 29.767578125, 30.69921875, 31.630859375, 32.5625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 54.0, 513.0, 419.0, 28.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.686092376708984, -50.46839141845703, -40.250694274902344, -30.032995223999023, -19.815296173095703, -9.597599029541016, 0.6201019287109375, 10.83780288696289, 21.055500030517578, 31.2731990814209, 41.49089813232422, 51.708595275878906, 61.92629623413086, 72.14399719238281, 82.3616943359375, 92.57939147949219, 102.79708862304688, 113.01478576660156, 123.23248291015625, 133.45018005371094, 143.66787719726562, 153.88558959960938, 164.10328674316406, 174.32098388671875, 184.53868103027344, 194.75637817382812, 204.9740753173828, 215.1917724609375, 225.40948486328125, 235.62716674804688, 245.84487915039062, 256.06256103515625, 266.2802734375, 276.49798583984375, 286.7156677246094, 296.9333801269531, 307.15106201171875, 317.3687744140625, 327.5864562988281, 337.8041687011719, 348.0218505859375, 358.23956298828125, 368.4572448730469, 378.6749572753906, 388.89263916015625, 399.1103515625, 409.3280334472656, 419.5457458496094, 429.7634582519531, 439.9811706542969, 450.1988525390625, 460.41656494140625, 470.6342468261719, 480.8519592285156, 491.06964111328125, 501.287353515625, 511.50506591796875, 521.7227783203125, 531.9404907226562, 542.1581420898438, 552.3758544921875, 562.5935668945312, 572.811279296875, 583.0289306640625, 593.2466430664062]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 7.0, 6.0, 7.0, 8.0, 15.0, 17.0, 14.0, 22.0, 17.0, 26.0, 31.0, 30.0, 28.0, 47.0, 43.0, 31.0, 41.0, 35.0, 58.0, 32.0, 43.0, 38.0, 33.0, 35.0, 30.0, 29.0, 27.0, 35.0, 27.0, 27.0, 17.0, 26.0, 13.0, 21.0, 11.0, 13.0, 14.0, 8.0, 4.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-45.06510925292969, -43.67557907104492, -42.286048889160156, -40.89651870727539, -39.506988525390625, -38.11745834350586, -36.727928161621094, -35.33839797973633, -33.94886779785156, -32.5593376159668, -31.16980743408203, -29.780277252197266, -28.3907470703125, -27.001216888427734, -25.61168670654297, -24.222156524658203, -22.83262825012207, -21.443098068237305, -20.05356788635254, -18.664037704467773, -17.274507522583008, -15.884977340698242, -14.495448112487793, -13.105917930603027, -11.716387748718262, -10.326857566833496, -8.93732738494873, -7.547797679901123, -6.158267498016357, -4.768737316131592, -3.3792076110839844, -1.9896774291992188, -0.6001472473144531, 0.789382815361023, 2.178912878036499, 3.5684428215026855, 4.957973003387451, 6.347503185272217, 7.737032890319824, 9.12656307220459, 10.516093254089355, 11.905623435974121, 13.295153617858887, 14.684682846069336, 16.0742130279541, 17.463743209838867, 18.853273391723633, 20.2428035736084, 21.632333755493164, 23.02186393737793, 24.411394119262695, 25.80092430114746, 27.190454483032227, 28.579984664916992, 29.969512939453125, 31.35904312133789, 32.748573303222656, 34.13810348510742, 35.52763366699219, 36.91716384887695, 38.30669403076172, 39.696224212646484, 41.08575439453125, 42.475284576416016, 43.86481475830078]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 7.0, 7.0, 12.0, 11.0, 12.0, 12.0, 20.0, 22.0, 22.0, 28.0, 27.0, 32.0, 24.0, 35.0, 33.0, 26.0, 31.0, 35.0, 38.0, 50.0, 42.0, 36.0, 37.0, 34.0, 44.0, 34.0, 33.0, 37.0, 32.0, 24.0, 25.0, 17.0, 13.0, 20.0, 16.0, 12.0, 9.0, 11.0, 2.0, 10.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.515625, -7.27972412109375, -7.0438232421875, -6.80792236328125, -6.572021484375, -6.33612060546875, -6.1002197265625, -5.86431884765625, -5.62841796875, -5.39251708984375, -5.1566162109375, -4.92071533203125, -4.684814453125, -4.44891357421875, -4.2130126953125, -3.97711181640625, -3.7412109375, -3.50531005859375, -3.2694091796875, -3.03350830078125, -2.797607421875, -2.56170654296875, -2.3258056640625, -2.08990478515625, -1.85400390625, -1.61810302734375, -1.3822021484375, -1.14630126953125, -0.910400390625, -0.67449951171875, -0.4385986328125, -0.20269775390625, 0.033203125, 0.26910400390625, 0.5050048828125, 0.74090576171875, 0.976806640625, 1.21270751953125, 1.4486083984375, 1.68450927734375, 1.92041015625, 2.15631103515625, 2.3922119140625, 2.62811279296875, 2.864013671875, 3.09991455078125, 3.3358154296875, 3.57171630859375, 3.8076171875, 4.04351806640625, 4.2794189453125, 4.51531982421875, 4.751220703125, 4.98712158203125, 5.2230224609375, 5.45892333984375, 5.69482421875, 5.93072509765625, 6.1666259765625, 6.40252685546875, 6.638427734375, 6.87432861328125, 7.1102294921875, 7.34613037109375, 7.58203125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 11.0, 13.0, 19.0, 40.0, 60.0, 115.0, 180.0, 267.0, 434.0, 717.0, 1091.0, 1775.0, 2791.0, 4649.0, 7332.0, 12090.0, 19904.0, 32964.0, 54303.0, 91099.0, 150663.0, 218324.0, 176339.0, 108377.0, 64810.0, 39339.0, 23482.0, 14361.0, 8760.0, 5472.0, 3392.0, 2024.0, 1211.0, 830.0, 480.0, 298.0, 200.0, 132.0, 74.0, 48.0, 36.0, 14.0, 13.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60009765625, -0.5798721313476562, -0.5596466064453125, -0.5394210815429688, -0.519195556640625, -0.49897003173828125, -0.4787445068359375, -0.45851898193359375, -0.43829345703125, -0.41806793212890625, -0.3978424072265625, -0.37761688232421875, -0.357391357421875, -0.33716583251953125, -0.3169403076171875, -0.29671478271484375, -0.2764892578125, -0.25626373291015625, -0.2360382080078125, -0.21581268310546875, -0.195587158203125, -0.17536163330078125, -0.1551361083984375, -0.13491058349609375, -0.11468505859375, -0.09445953369140625, -0.0742340087890625, -0.05400848388671875, -0.033782958984375, -0.01355743408203125, 0.0066680908203125, 0.02689361572265625, 0.047119140625, 0.06734466552734375, 0.0875701904296875, 0.10779571533203125, 0.128021240234375, 0.14824676513671875, 0.1684722900390625, 0.18869781494140625, 0.20892333984375, 0.22914886474609375, 0.2493743896484375, 0.26959991455078125, 0.289825439453125, 0.31005096435546875, 0.3302764892578125, 0.35050201416015625, 0.3707275390625, 0.39095306396484375, 0.4111785888671875, 0.43140411376953125, 0.451629638671875, 0.47185516357421875, 0.4920806884765625, 0.5123062133789062, 0.53253173828125, 0.5527572631835938, 0.5729827880859375, 0.5932083129882812, 0.613433837890625, 0.6336593627929688, 0.6538848876953125, 0.6741104125976562, 0.6943359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 8.0, 6.0, 15.0, 5.0, 22.0, 8.0, 16.0, 15.0, 16.0, 16.0, 17.0, 26.0, 25.0, 22.0, 23.0, 23.0, 25.0, 30.0, 28.0, 34.0, 36.0, 1059.0, 51.0, 43.0, 38.0, 25.0, 37.0, 27.0, 33.0, 32.0, 31.0, 26.0, 33.0, 17.0, 20.0, 14.0, 19.0, 18.0, 14.0, 8.0, 13.0, 10.0, 6.0, 4.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.546875, -4.404296875, -4.26171875, -4.119140625, -3.9765625, -3.833984375, -3.69140625, -3.548828125, -3.40625, -3.263671875, -3.12109375, -2.978515625, -2.8359375, -2.693359375, -2.55078125, -2.408203125, -2.265625, -2.123046875, -1.98046875, -1.837890625, -1.6953125, -1.552734375, -1.41015625, -1.267578125, -1.125, -0.982421875, -0.83984375, -0.697265625, -0.5546875, -0.412109375, -0.26953125, -0.126953125, 0.015625, 0.158203125, 0.30078125, 0.443359375, 0.5859375, 0.728515625, 0.87109375, 1.013671875, 1.15625, 1.298828125, 1.44140625, 1.583984375, 1.7265625, 1.869140625, 2.01171875, 2.154296875, 2.296875, 2.439453125, 2.58203125, 2.724609375, 2.8671875, 3.009765625, 3.15234375, 3.294921875, 3.4375, 3.580078125, 3.72265625, 3.865234375, 4.0078125, 4.150390625, 4.29296875, 4.435546875, 4.578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 10.0, 10.0, 16.0, 22.0, 22.0, 30.0, 79.0, 109.0, 135.0, 241.0, 343.0, 533.0, 811.0, 1209.0, 1848.0, 2676.0, 4091.0, 6297.0, 9261.0, 14092.0, 21283.0, 32121.0, 48358.0, 73198.0, 110175.0, 155831.0, 1217841.0, 132330.0, 89912.0, 58689.0, 38923.0, 25692.0, 17271.0, 11404.0, 7479.0, 4998.0, 3301.0, 2251.0, 1434.0, 987.0, 582.0, 430.0, 290.0, 177.0, 126.0, 75.0, 41.0, 38.0, 14.0, 20.0, 14.0, 8.0, 7.0, 0.0, 0.0, 3.0, 6.0], "bins": [-0.5009765625, -0.4859046936035156, -0.47083282470703125, -0.4557609558105469, -0.4406890869140625, -0.4256172180175781, -0.41054534912109375, -0.3954734802246094, -0.380401611328125, -0.3653297424316406, -0.35025787353515625, -0.3351860046386719, -0.3201141357421875, -0.3050422668457031, -0.28997039794921875, -0.2748985290527344, -0.25982666015625, -0.24475479125976562, -0.22968292236328125, -0.21461105346679688, -0.1995391845703125, -0.18446731567382812, -0.16939544677734375, -0.15432357788085938, -0.139251708984375, -0.12417984008789062, -0.10910797119140625, -0.09403610229492188, -0.0789642333984375, -0.06389236450195312, -0.04882049560546875, -0.033748626708984375, -0.0186767578125, -0.003604888916015625, 0.01146697998046875, 0.026538848876953125, 0.0416107177734375, 0.056682586669921875, 0.07175445556640625, 0.08682632446289062, 0.101898193359375, 0.11697006225585938, 0.13204193115234375, 0.14711380004882812, 0.1621856689453125, 0.17725753784179688, 0.19232940673828125, 0.20740127563476562, 0.22247314453125, 0.23754501342773438, 0.25261688232421875, 0.2676887512207031, 0.2827606201171875, 0.2978324890136719, 0.31290435791015625, 0.3279762268066406, 0.343048095703125, 0.3581199645996094, 0.37319183349609375, 0.3882637023925781, 0.4033355712890625, 0.4184074401855469, 0.43347930908203125, 0.4485511779785156, 0.463623046875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 5.0, 6.0, 7.0, 9.0, 4.0, 8.0, 3.0, 18.0, 26.0, 24.0, 20.0, 18.0, 30.0, 37.0, 28.0, 37.0, 37.0, 51.0, 50.0, 49.0, 58.0, 55.0, 49.0, 52.0, 32.0, 48.0, 28.0, 34.0, 26.0, 25.0, 21.0, 15.0, 15.0, 17.0, 6.0, 8.0, 9.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0018224716186523438, -0.0017688721418380737, -0.0017152726650238037, -0.0016616731882095337, -0.0016080737113952637, -0.0015544742345809937, -0.0015008747577667236, -0.0014472752809524536, -0.0013936758041381836, -0.0013400763273239136, -0.0012864768505096436, -0.0012328773736953735, -0.0011792778968811035, -0.0011256784200668335, -0.0010720789432525635, -0.0010184794664382935, -0.0009648799896240234, -0.0009112805128097534, -0.0008576810359954834, -0.0008040815591812134, -0.0007504820823669434, -0.0006968826055526733, -0.0006432831287384033, -0.0005896836519241333, -0.0005360841751098633, -0.00048248469829559326, -0.00042888522148132324, -0.0003752857446670532, -0.0003216862678527832, -0.0002680867910385132, -0.00021448731422424316, -0.00016088783740997314, -0.00010728836059570312, -5.3688883781433105e-05, -8.940696716308594e-08, 5.3510069847106934e-05, 0.00010710954666137695, 0.00016070902347564697, 0.000214308500289917, 0.000267907977104187, 0.00032150745391845703, 0.00037510693073272705, 0.00042870640754699707, 0.0004823058843612671, 0.0005359053611755371, 0.0005895048379898071, 0.0006431043148040771, 0.0006967037916183472, 0.0007503032684326172, 0.0008039027452468872, 0.0008575022220611572, 0.0009111016988754272, 0.0009647011756896973, 0.0010183006525039673, 0.0010719001293182373, 0.0011254996061325073, 0.0011790990829467773, 0.0012326985597610474, 0.0012862980365753174, 0.0013398975133895874, 0.0013934969902038574, 0.0014470964670181274, 0.0015006959438323975, 0.0015542954206466675, 0.0016078948974609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 5.0, 9.0, 11.0, 17.0, 32.0, 21.0, 33.0, 41.0, 46.0, 71.0, 94.0, 124.0, 193.0, 316.0, 617.0, 1793.0, 854170.0, 188401.0, 1115.0, 499.0, 273.0, 154.0, 104.0, 85.0, 63.0, 54.0, 47.0, 22.0, 25.0, 17.0, 12.0, 13.0, 13.0, 10.0, 6.0, 2.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.037353515625, -0.03614377975463867, -0.034934043884277344, -0.033724308013916016, -0.03251457214355469, -0.03130483627319336, -0.03009510040283203, -0.028885364532470703, -0.027675628662109375, -0.026465892791748047, -0.02525615692138672, -0.02404642105102539, -0.022836685180664062, -0.021626949310302734, -0.020417213439941406, -0.019207477569580078, -0.01799774169921875, -0.016788005828857422, -0.015578269958496094, -0.014368534088134766, -0.013158798217773438, -0.01194906234741211, -0.010739326477050781, -0.009529590606689453, -0.008319854736328125, -0.007110118865966797, -0.005900382995605469, -0.004690647125244141, -0.0034809112548828125, -0.0022711753845214844, -0.0010614395141601562, 0.00014829635620117188, 0.0013580322265625, 0.002567768096923828, 0.0037775039672851562, 0.004987239837646484, 0.0061969757080078125, 0.007406711578369141, 0.008616447448730469, 0.009826183319091797, 0.011035919189453125, 0.012245655059814453, 0.013455390930175781, 0.01466512680053711, 0.015874862670898438, 0.017084598541259766, 0.018294334411621094, 0.019504070281982422, 0.02071380615234375, 0.021923542022705078, 0.023133277893066406, 0.024343013763427734, 0.025552749633789062, 0.02676248550415039, 0.02797222137451172, 0.029181957244873047, 0.030391693115234375, 0.0316014289855957, 0.03281116485595703, 0.03402090072631836, 0.03523063659667969, 0.036440372467041016, 0.037650108337402344, 0.03885984420776367, 0.040069580078125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 247.0, 738.0, 25.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01695728488266468, -0.016632722690701485, -0.01630816049873829, -0.015983598306775093, -0.015659036114811897, -0.015334473922848701, -0.015009911730885506, -0.01468534953892231, -0.014360787346959114, -0.014036225154995918, -0.013711662963032722, -0.013387100771069527, -0.013062538579106331, -0.012737976387143135, -0.01241341419517994, -0.012088852003216743, -0.011764289811253548, -0.011439727619290352, -0.011115165427327156, -0.01079060323536396, -0.010466041043400764, -0.010141478851437569, -0.009816916659474373, -0.009492354467511177, -0.009167792275547981, -0.008843230083584785, -0.00851866789162159, -0.008194105699658394, -0.007869543507695198, -0.007544981315732002, -0.0072204191237688065, -0.006895856931805611, -0.006571294739842415, -0.006246732547879219, -0.005922170355916023, -0.0055976081639528275, -0.005273045971989632, -0.004948483780026436, -0.00462392158806324, -0.004299359396100044, -0.0039747972041368484, -0.0036502350121736526, -0.003325672820210457, -0.003001110628247261, -0.0026765484362840652, -0.0023519862443208694, -0.0020274240523576736, -0.0017028618603944778, -0.0013782994356006384, -0.0010537372436374426, -0.0007291750516742468, -0.000404612859711051, -8.005066774785519e-05, 0.0002445115242153406, 0.0005690737161785364, 0.0008936359081417322, 0.001218198100104928, 0.0015427602920681238, 0.0018673224840313196, 0.0021918846759945154, 0.0025164468679577112, 0.002841009059920907, 0.003165571251884103, 0.0034901334438472986, 0.0038146956358104944]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 7.0, 9.0, 9.0, 7.0, 15.0, 15.0, 20.0, 19.0, 22.0, 25.0, 30.0, 30.0, 38.0, 35.0, 36.0, 47.0, 32.0, 38.0, 50.0, 39.0, 38.0, 41.0, 45.0, 38.0, 36.0, 36.0, 29.0, 29.0, 30.0, 17.0, 21.0, 27.0, 15.0, 14.0, 11.0, 9.0, 9.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010389089584350586, -0.0010055126622319221, -0.0009721163660287857, -0.0009387200698256493, -0.0009053237736225128, -0.0008719274774193764, -0.0008385311812162399, -0.0008051348850131035, -0.000771738588809967, -0.0007383422926068306, -0.0007049459964036942, -0.0006715497002005577, -0.0006381534039974213, -0.0006047571077942848, -0.0005713608115911484, -0.0005379645153880119, -0.0005045682191848755, -0.00047117192298173904, -0.0004377756267786026, -0.00040437933057546616, -0.0003709830343723297, -0.00033758673816919327, -0.0003041904419660568, -0.0002707941457629204, -0.00023739784955978394, -0.0002040015533566475, -0.00017060525715351105, -0.0001372089609503746, -0.00010381266474723816, -7.041636854410172e-05, -3.702007234096527e-05, -3.623776137828827e-06, 2.9772520065307617e-05, 6.316881626844406e-05, 9.65651124715805e-05, 0.00012996140867471695, 0.0001633577048778534, 0.00019675400108098984, 0.00023015029728412628, 0.0002635465934872627, 0.00029694288969039917, 0.0003303391858935356, 0.00036373548209667206, 0.0003971317782998085, 0.00043052807450294495, 0.0004639243707060814, 0.0004973206669092178, 0.0005307169631123543, 0.0005641132593154907, 0.0005975095555186272, 0.0006309058517217636, 0.0006643021479249001, 0.0006976984441280365, 0.0007310947403311729, 0.0007644910365343094, 0.0007978873327374458, 0.0008312836289405823, 0.0008646799251437187, 0.0008980762213468552, 0.0009314725175499916, 0.000964868813753128, 0.0009982651099562645, 0.001031661406159401, 0.0010650577023625374, 0.0010984539985656738]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 7.0, 12.0, 11.0, 12.0, 12.0, 20.0, 22.0, 22.0, 28.0, 27.0, 33.0, 23.0, 35.0, 33.0, 26.0, 31.0, 35.0, 38.0, 50.0, 42.0, 36.0, 37.0, 34.0, 44.0, 34.0, 33.0, 37.0, 32.0, 24.0, 25.0, 17.0, 13.0, 20.0, 16.0, 12.0, 9.0, 11.0, 2.0, 10.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.515625, -7.27972412109375, -7.0438232421875, -6.80792236328125, -6.572021484375, -6.33612060546875, -6.1002197265625, -5.86431884765625, -5.62841796875, -5.39251708984375, -5.1566162109375, -4.92071533203125, -4.684814453125, -4.44891357421875, -4.2130126953125, -3.97711181640625, -3.7412109375, -3.50531005859375, -3.2694091796875, -3.03350830078125, -2.797607421875, -2.56170654296875, -2.3258056640625, -2.08990478515625, -1.85400390625, -1.61810302734375, -1.3822021484375, -1.14630126953125, -0.910400390625, -0.67449951171875, -0.4385986328125, -0.20269775390625, 0.033203125, 0.26910400390625, 0.5050048828125, 0.74090576171875, 0.976806640625, 1.21270751953125, 1.4486083984375, 1.68450927734375, 1.92041015625, 2.15631103515625, 2.3922119140625, 2.62811279296875, 2.864013671875, 3.09991455078125, 3.3358154296875, 3.57171630859375, 3.8076171875, 4.04351806640625, 4.2794189453125, 4.51531982421875, 4.751220703125, 4.98712158203125, 5.2230224609375, 5.45892333984375, 5.69482421875, 5.93072509765625, 6.1666259765625, 6.40252685546875, 6.638427734375, 6.87432861328125, 7.1102294921875, 7.34613037109375, 7.58203125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 11.0, 16.0, 13.0, 26.0, 30.0, 41.0, 60.0, 68.0, 86.0, 100.0, 155.0, 193.0, 260.0, 331.0, 477.0, 749.0, 1622.0, 4693.0, 17705.0, 90345.0, 746660.0, 149004.0, 24717.0, 6243.0, 2020.0, 857.0, 548.0, 379.0, 258.0, 209.0, 157.0, 113.0, 83.0, 81.0, 49.0, 45.0, 29.0, 25.0, 15.0, 11.0, 14.0, 8.0, 8.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-18.546875, -17.960205078125, -17.37353515625, -16.786865234375, -16.2001953125, -15.613525390625, -15.02685546875, -14.440185546875, -13.853515625, -13.266845703125, -12.68017578125, -12.093505859375, -11.5068359375, -10.920166015625, -10.33349609375, -9.746826171875, -9.16015625, -8.573486328125, -7.98681640625, -7.400146484375, -6.8134765625, -6.226806640625, -5.64013671875, -5.053466796875, -4.466796875, -3.880126953125, -3.29345703125, -2.706787109375, -2.1201171875, -1.533447265625, -0.94677734375, -0.360107421875, 0.2265625, 0.813232421875, 1.39990234375, 1.986572265625, 2.5732421875, 3.159912109375, 3.74658203125, 4.333251953125, 4.919921875, 5.506591796875, 6.09326171875, 6.679931640625, 7.2666015625, 7.853271484375, 8.43994140625, 9.026611328125, 9.61328125, 10.199951171875, 10.78662109375, 11.373291015625, 11.9599609375, 12.546630859375, 13.13330078125, 13.719970703125, 14.306640625, 14.893310546875, 15.47998046875, 16.066650390625, 16.6533203125, 17.239990234375, 17.82666015625, 18.413330078125, 19.0]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 2.0, 2.0, 3.0, 7.0, 13.0, 11.0, 14.0, 20.0, 30.0, 30.0, 25.0, 24.0, 27.0, 30.0, 42.0, 36.0, 47.0, 63.0, 89.0, 167.0, 1471.0, 330.0, 112.0, 63.0, 49.0, 40.0, 39.0, 36.0, 25.0, 38.0, 21.0, 23.0, 17.0, 17.0, 11.0, 15.0, 13.0, 9.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-22.265625, -21.564453125, -20.86328125, -20.162109375, -19.4609375, -18.759765625, -18.05859375, -17.357421875, -16.65625, -15.955078125, -15.25390625, -14.552734375, -13.8515625, -13.150390625, -12.44921875, -11.748046875, -11.046875, -10.345703125, -9.64453125, -8.943359375, -8.2421875, -7.541015625, -6.83984375, -6.138671875, -5.4375, -4.736328125, -4.03515625, -3.333984375, -2.6328125, -1.931640625, -1.23046875, -0.529296875, 0.171875, 0.873046875, 1.57421875, 2.275390625, 2.9765625, 3.677734375, 4.37890625, 5.080078125, 5.78125, 6.482421875, 7.18359375, 7.884765625, 8.5859375, 9.287109375, 9.98828125, 10.689453125, 11.390625, 12.091796875, 12.79296875, 13.494140625, 14.1953125, 14.896484375, 15.59765625, 16.298828125, 17.0, 17.701171875, 18.40234375, 19.103515625, 19.8046875, 20.505859375, 21.20703125, 21.908203125, 22.609375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 10.0, 6.0, 17.0, 19.0, 15.0, 17.0, 21.0, 39.0, 31.0, 55.0, 58.0, 90.0, 108.0, 218.0, 387.0, 1007.0, 4757.0, 287507.0, 2836732.0, 11690.0, 1527.0, 508.0, 257.0, 144.0, 98.0, 68.0, 57.0, 56.0, 47.0, 35.0, 26.0, 16.0, 21.0, 12.0, 6.0, 8.0, 3.0, 6.0, 8.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.6875, -61.6435546875, -59.599609375, -57.5556640625, -55.51171875, -53.4677734375, -51.423828125, -49.3798828125, -47.3359375, -45.2919921875, -43.248046875, -41.2041015625, -39.16015625, -37.1162109375, -35.072265625, -33.0283203125, -30.984375, -28.9404296875, -26.896484375, -24.8525390625, -22.80859375, -20.7646484375, -18.720703125, -16.6767578125, -14.6328125, -12.5888671875, -10.544921875, -8.5009765625, -6.45703125, -4.4130859375, -2.369140625, -0.3251953125, 1.71875, 3.7626953125, 5.806640625, 7.8505859375, 9.89453125, 11.9384765625, 13.982421875, 16.0263671875, 18.0703125, 20.1142578125, 22.158203125, 24.2021484375, 26.24609375, 28.2900390625, 30.333984375, 32.3779296875, 34.421875, 36.4658203125, 38.509765625, 40.5537109375, 42.59765625, 44.6416015625, 46.685546875, 48.7294921875, 50.7734375, 52.8173828125, 54.861328125, 56.9052734375, 58.94921875, 60.9931640625, 63.037109375, 65.0810546875, 67.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 10.0, 123.0, 336.0, 375.0, 139.0, 26.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.370925903320312, -17.832563400268555, -14.29420280456543, -10.755840301513672, -7.2174787521362305, -3.679117202758789, -0.14075469970703125, 3.3976058959960938, 6.935968399047852, 10.474329948425293, 14.012691497802734, 17.551054000854492, 21.08941650390625, 24.627777099609375, 28.166139602661133, 31.704500198364258, 35.242862701416016, 38.78122329711914, 42.31958770751953, 45.857948303222656, 49.39630889892578, 52.934669494628906, 56.4730339050293, 60.01139450073242, 63.54975891113281, 67.08811950683594, 70.62648010253906, 74.16484069824219, 77.70320892333984, 81.24156951904297, 84.7799301147461, 88.31829071044922, 91.85665130615234, 95.39501190185547, 98.9333724975586, 102.47174072265625, 106.01010131835938, 109.5484619140625, 113.08682250976562, 116.62518310546875, 120.16354370117188, 123.701904296875, 127.24026489257812, 130.77862548828125, 134.31698608398438, 137.8553466796875, 141.39370727539062, 144.93206787109375, 148.47044372558594, 152.00880432128906, 155.5471649169922, 159.0855255126953, 162.62388610839844, 166.16224670410156, 169.70062255859375, 173.23898315429688, 176.77732849121094, 180.31568908691406, 183.8540496826172, 187.3924102783203, 190.93077087402344, 194.46913146972656, 198.00750732421875, 201.54586791992188, 205.084228515625]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 6.0, 13.0, 8.0, 14.0, 12.0, 13.0, 12.0, 17.0, 22.0, 14.0, 22.0, 25.0, 40.0, 37.0, 21.0, 26.0, 21.0, 39.0, 38.0, 40.0, 39.0, 35.0, 47.0, 47.0, 32.0, 33.0, 26.0, 34.0, 31.0, 36.0, 26.0, 31.0, 23.0, 10.0, 19.0, 15.0, 12.0, 13.0, 10.0, 7.0, 7.0, 4.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.70460510253906, -59.826332092285156, -57.948062896728516, -56.06978988647461, -54.1915168762207, -52.31324768066406, -50.434974670410156, -48.55670166015625, -46.678428649902344, -44.80015563964844, -42.9218864440918, -41.04361343383789, -39.165340423583984, -37.287071228027344, -35.40879821777344, -33.53052520751953, -31.65225601196289, -29.773984909057617, -27.89571189880371, -26.017440795898438, -24.13916778564453, -22.260896682739258, -20.382625579833984, -18.504352569580078, -16.626081466674805, -14.747809410095215, -12.869537353515625, -10.991266250610352, -9.112994194030762, -7.234722137451172, -5.356451034545898, -3.4781789779663086, -1.5999031066894531, 0.2783687114715576, 2.1566405296325684, 4.034912109375, 5.91318416595459, 7.79145622253418, 9.669727325439453, 11.547999382019043, 13.426271438598633, 15.304543495178223, 17.182815551757812, 19.061086654663086, 20.93935775756836, 22.817630767822266, 24.69590187072754, 26.574172973632812, 28.45244598388672, 30.330717086791992, 32.208988189697266, 34.08726119995117, 35.96553421020508, 37.84380340576172, 39.722076416015625, 41.60034942626953, 43.47862243652344, 45.356895446777344, 47.235164642333984, 49.11343765258789, 50.9917106628418, 52.86997985839844, 54.748252868652344, 56.62652587890625, 58.50479507446289]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 4.0, 3.0, 6.0, 10.0, 11.0, 10.0, 13.0, 13.0, 22.0, 19.0, 26.0, 30.0, 26.0, 25.0, 25.0, 27.0, 31.0, 31.0, 41.0, 52.0, 40.0, 36.0, 46.0, 40.0, 38.0, 39.0, 40.0, 40.0, 36.0, 19.0, 23.0, 20.0, 14.0, 27.0, 19.0, 15.0, 15.0, 10.0, 11.0, 5.0, 8.0, 7.0, 3.0, 7.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.15625, -7.9111328125, -7.666015625, -7.4208984375, -7.17578125, -6.9306640625, -6.685546875, -6.4404296875, -6.1953125, -5.9501953125, -5.705078125, -5.4599609375, -5.21484375, -4.9697265625, -4.724609375, -4.4794921875, -4.234375, -3.9892578125, -3.744140625, -3.4990234375, -3.25390625, -3.0087890625, -2.763671875, -2.5185546875, -2.2734375, -2.0283203125, -1.783203125, -1.5380859375, -1.29296875, -1.0478515625, -0.802734375, -0.5576171875, -0.3125, -0.0673828125, 0.177734375, 0.4228515625, 0.66796875, 0.9130859375, 1.158203125, 1.4033203125, 1.6484375, 1.8935546875, 2.138671875, 2.3837890625, 2.62890625, 2.8740234375, 3.119140625, 3.3642578125, 3.609375, 3.8544921875, 4.099609375, 4.3447265625, 4.58984375, 4.8349609375, 5.080078125, 5.3251953125, 5.5703125, 5.8154296875, 6.060546875, 6.3056640625, 6.55078125, 6.7958984375, 7.041015625, 7.2861328125, 7.53125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 9.0, 9.0, 15.0, 18.0, 12.0, 24.0, 27.0, 38.0, 43.0, 59.0, 77.0, 108.0, 147.0, 201.0, 326.0, 588.0, 1486.0, 5421.0, 28072.0, 199086.0, 1166425.0, 2041192.0, 635678.0, 95540.0, 14250.0, 3019.0, 977.0, 441.0, 272.0, 185.0, 123.0, 93.0, 57.0, 48.0, 49.0, 43.0, 19.0, 25.0, 22.0, 9.0, 12.0, 10.0, 8.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.9375, -13.506103515625, -13.07470703125, -12.643310546875, -12.2119140625, -11.780517578125, -11.34912109375, -10.917724609375, -10.486328125, -10.054931640625, -9.62353515625, -9.192138671875, -8.7607421875, -8.329345703125, -7.89794921875, -7.466552734375, -7.03515625, -6.603759765625, -6.17236328125, -5.740966796875, -5.3095703125, -4.878173828125, -4.44677734375, -4.015380859375, -3.583984375, -3.152587890625, -2.72119140625, -2.289794921875, -1.8583984375, -1.427001953125, -0.99560546875, -0.564208984375, -0.1328125, 0.298583984375, 0.72998046875, 1.161376953125, 1.5927734375, 2.024169921875, 2.45556640625, 2.886962890625, 3.318359375, 3.749755859375, 4.18115234375, 4.612548828125, 5.0439453125, 5.475341796875, 5.90673828125, 6.338134765625, 6.76953125, 7.200927734375, 7.63232421875, 8.063720703125, 8.4951171875, 8.926513671875, 9.35791015625, 9.789306640625, 10.220703125, 10.652099609375, 11.08349609375, 11.514892578125, 11.9462890625, 12.377685546875, 12.80908203125, 13.240478515625, 13.671875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 12.0, 6.0, 12.0, 29.0, 33.0, 38.0, 56.0, 75.0, 102.0, 122.0, 176.0, 201.0, 283.0, 324.0, 379.0, 396.0, 379.0, 329.0, 261.0, 201.0, 164.0, 121.0, 79.0, 65.0, 49.0, 27.0, 31.0, 12.0, 17.0, 14.0, 11.0, 9.0, 15.0, 5.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0], "bins": [-13.90625, -13.5343017578125, -13.162353515625, -12.7904052734375, -12.41845703125, -12.0465087890625, -11.674560546875, -11.3026123046875, -10.9306640625, -10.5587158203125, -10.186767578125, -9.8148193359375, -9.44287109375, -9.0709228515625, -8.698974609375, -8.3270263671875, -7.955078125, -7.5831298828125, -7.211181640625, -6.8392333984375, -6.46728515625, -6.0953369140625, -5.723388671875, -5.3514404296875, -4.9794921875, -4.6075439453125, -4.235595703125, -3.8636474609375, -3.49169921875, -3.1197509765625, -2.747802734375, -2.3758544921875, -2.00390625, -1.6319580078125, -1.260009765625, -0.8880615234375, -0.51611328125, -0.1441650390625, 0.227783203125, 0.5997314453125, 0.9716796875, 1.3436279296875, 1.715576171875, 2.0875244140625, 2.45947265625, 2.8314208984375, 3.203369140625, 3.5753173828125, 3.947265625, 4.3192138671875, 4.691162109375, 5.0631103515625, 5.43505859375, 5.8070068359375, 6.178955078125, 6.5509033203125, 6.9228515625, 7.2947998046875, 7.666748046875, 8.0386962890625, 8.41064453125, 8.7825927734375, 9.154541015625, 9.5264892578125, 9.8984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 6.0, 14.0, 12.0, 24.0, 20.0, 28.0, 35.0, 46.0, 57.0, 96.0, 129.0, 236.0, 319.0, 488.0, 863.0, 2073.0, 7647.0, 61020.0, 1181013.0, 2760357.0, 158765.0, 15047.0, 3119.0, 1146.0, 561.0, 349.0, 204.0, 184.0, 126.0, 68.0, 52.0, 44.0, 24.0, 20.0, 17.0, 19.0, 12.0, 9.0, 6.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.296875, -24.399169921875, -23.50146484375, -22.603759765625, -21.7060546875, -20.808349609375, -19.91064453125, -19.012939453125, -18.115234375, -17.217529296875, -16.31982421875, -15.422119140625, -14.5244140625, -13.626708984375, -12.72900390625, -11.831298828125, -10.93359375, -10.035888671875, -9.13818359375, -8.240478515625, -7.3427734375, -6.445068359375, -5.54736328125, -4.649658203125, -3.751953125, -2.854248046875, -1.95654296875, -1.058837890625, -0.1611328125, 0.736572265625, 1.63427734375, 2.531982421875, 3.4296875, 4.327392578125, 5.22509765625, 6.122802734375, 7.0205078125, 7.918212890625, 8.81591796875, 9.713623046875, 10.611328125, 11.509033203125, 12.40673828125, 13.304443359375, 14.2021484375, 15.099853515625, 15.99755859375, 16.895263671875, 17.79296875, 18.690673828125, 19.58837890625, 20.486083984375, 21.3837890625, 22.281494140625, 23.17919921875, 24.076904296875, 24.974609375, 25.872314453125, 26.77001953125, 27.667724609375, 28.5654296875, 29.463134765625, 30.36083984375, 31.258544921875, 32.15625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 24.0, 431.0, 517.0, 42.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-195.6342010498047, -184.1607208251953, -172.68724060058594, -161.21376037597656, -149.7402801513672, -138.2667999267578, -126.79332733154297, -115.3198471069336, -103.84636688232422, -92.37288665771484, -80.89940643310547, -69.42593383789062, -57.952449798583984, -46.47896957397461, -35.0054931640625, -23.532012939453125, -12.05853271484375, -0.5850534439086914, 10.888425827026367, 22.36190414428711, 33.835384368896484, 45.30886459350586, 56.78234100341797, 68.25582122802734, 79.72930145263672, 91.2027816772461, 102.67626190185547, 114.14973449707031, 125.62321472167969, 137.09669494628906, 148.57017517089844, 160.0436553955078, 171.51712036132812, 182.9906005859375, 194.46408081054688, 205.93756103515625, 217.41104125976562, 228.884521484375, 240.35800170898438, 251.83148193359375, 263.3049621582031, 274.7784423828125, 286.2519226074219, 297.72540283203125, 309.1988830566406, 320.67236328125, 332.1458435058594, 343.61932373046875, 355.0927734375, 366.5662536621094, 378.03973388671875, 389.5132141113281, 400.9866943359375, 412.4601745605469, 423.93365478515625, 435.4071350097656, 446.880615234375, 458.3540954589844, 469.82757568359375, 481.3010559082031, 492.7745361328125, 504.2480163574219, 515.7214965820312, 527.1949462890625, 538.66845703125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 4.0, 11.0, 10.0, 11.0, 15.0, 18.0, 22.0, 22.0, 21.0, 38.0, 31.0, 25.0, 31.0, 40.0, 32.0, 45.0, 37.0, 32.0, 50.0, 52.0, 45.0, 48.0, 35.0, 40.0, 24.0, 23.0, 26.0, 23.0, 21.0, 25.0, 24.0, 18.0, 13.0, 16.0, 5.0, 9.0, 13.0, 6.0, 6.0, 9.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-44.03077697753906, -42.614967346191406, -41.199153900146484, -39.78334426879883, -38.367530822753906, -36.95172119140625, -35.535911560058594, -34.12009811401367, -32.704288482666016, -31.288476943969727, -29.872665405273438, -28.45685577392578, -27.041044235229492, -25.625232696533203, -24.209421157836914, -22.793609619140625, -21.377798080444336, -19.961986541748047, -18.546175003051758, -17.13036346435547, -15.714553833007812, -14.298742294311523, -12.882930755615234, -11.467120170593262, -10.051308631896973, -8.635497093200684, -7.219686508178711, -5.803874969482422, -4.388063907623291, -2.97225284576416, -1.556441307067871, -0.14063072204589844, 1.2751808166503906, 2.6909918785095215, 4.106802940368652, 5.522614479064941, 6.938425540924072, 8.354236602783203, 9.770048141479492, 11.185858726501465, 12.601670265197754, 14.017481803894043, 15.433292388916016, 16.849103927612305, 18.264915466308594, 19.68072509765625, 21.096538543701172, 22.512348175048828, 23.928159713745117, 25.343971252441406, 26.759782791137695, 28.175594329833984, 29.59140396118164, 31.00721549987793, 32.42302703857422, 33.838836669921875, 35.2546501159668, 36.67045974731445, 38.086273193359375, 39.50208282470703, 40.91789627075195, 42.33370590209961, 43.74951934814453, 45.16532897949219, 46.581138610839844]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 11.0, 5.0, 11.0, 7.0, 8.0, 10.0, 20.0, 14.0, 17.0, 15.0, 21.0, 15.0, 33.0, 28.0, 32.0, 31.0, 40.0, 31.0, 34.0, 41.0, 34.0, 43.0, 56.0, 32.0, 51.0, 38.0, 32.0, 39.0, 37.0, 24.0, 24.0, 21.0, 19.0, 18.0, 21.0, 16.0, 13.0, 7.0, 9.0, 4.0, 11.0, 11.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.9569091796875, -7.695068359375, -7.4332275390625, -7.17138671875, -6.9095458984375, -6.647705078125, -6.3858642578125, -6.1240234375, -5.8621826171875, -5.600341796875, -5.3385009765625, -5.07666015625, -4.8148193359375, -4.552978515625, -4.2911376953125, -4.029296875, -3.7674560546875, -3.505615234375, -3.2437744140625, -2.98193359375, -2.7200927734375, -2.458251953125, -2.1964111328125, -1.9345703125, -1.6727294921875, -1.410888671875, -1.1490478515625, -0.88720703125, -0.6253662109375, -0.363525390625, -0.1016845703125, 0.16015625, 0.4219970703125, 0.683837890625, 0.9456787109375, 1.20751953125, 1.4693603515625, 1.731201171875, 1.9930419921875, 2.2548828125, 2.5167236328125, 2.778564453125, 3.0404052734375, 3.30224609375, 3.5640869140625, 3.825927734375, 4.0877685546875, 4.349609375, 4.6114501953125, 4.873291015625, 5.1351318359375, 5.39697265625, 5.6588134765625, 5.920654296875, 6.1824951171875, 6.4443359375, 6.7061767578125, 6.968017578125, 7.2298583984375, 7.49169921875, 7.7535400390625, 8.015380859375, 8.2772216796875, 8.5390625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 6.0, 17.0, 11.0, 26.0, 27.0, 52.0, 67.0, 107.0, 147.0, 196.0, 293.0, 400.0, 587.0, 815.0, 1229.0, 1785.0, 2461.0, 3661.0, 5341.0, 7575.0, 11142.0, 16510.0, 24790.0, 36164.0, 54750.0, 83097.0, 122764.0, 164017.0, 159570.0, 115008.0, 78567.0, 51290.0, 33990.0, 23003.0, 15495.0, 10526.0, 7181.0, 4928.0, 3361.0, 2339.0, 1594.0, 1099.0, 708.0, 551.0, 397.0, 279.0, 193.0, 147.0, 84.0, 74.0, 43.0, 34.0, 25.0, 7.0, 14.0, 7.0, 9.0, 3.0, 3.0, 2.0], "bins": [-0.5625, -0.5448760986328125, -0.527252197265625, -0.5096282958984375, -0.49200439453125, -0.4743804931640625, -0.456756591796875, -0.4391326904296875, -0.4215087890625, -0.4038848876953125, -0.386260986328125, -0.3686370849609375, -0.35101318359375, -0.3333892822265625, -0.315765380859375, -0.2981414794921875, -0.280517578125, -0.2628936767578125, -0.245269775390625, -0.2276458740234375, -0.21002197265625, -0.1923980712890625, -0.174774169921875, -0.1571502685546875, -0.1395263671875, -0.1219024658203125, -0.104278564453125, -0.0866546630859375, -0.06903076171875, -0.0514068603515625, -0.033782958984375, -0.0161590576171875, 0.00146484375, 0.0190887451171875, 0.036712646484375, 0.0543365478515625, 0.07196044921875, 0.0895843505859375, 0.107208251953125, 0.1248321533203125, 0.1424560546875, 0.1600799560546875, 0.177703857421875, 0.1953277587890625, 0.21295166015625, 0.2305755615234375, 0.248199462890625, 0.2658233642578125, 0.283447265625, 0.3010711669921875, 0.318695068359375, 0.3363189697265625, 0.35394287109375, 0.3715667724609375, 0.389190673828125, 0.4068145751953125, 0.4244384765625, 0.4420623779296875, 0.459686279296875, 0.4773101806640625, 0.49493408203125, 0.5125579833984375, 0.530181884765625, 0.5478057861328125, 0.5654296875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 6.0, 8.0, 14.0, 8.0, 18.0, 14.0, 17.0, 25.0, 18.0, 26.0, 18.0, 28.0, 26.0, 32.0, 34.0, 30.0, 53.0, 38.0, 51.0, 1056.0, 26.0, 51.0, 42.0, 43.0, 41.0, 47.0, 24.0, 23.0, 25.0, 27.0, 22.0, 15.0, 16.0, 24.0, 11.0, 11.0, 10.0, 5.0, 4.0, 12.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-5.6484375, -5.4747314453125, -5.301025390625, -5.1273193359375, -4.95361328125, -4.7799072265625, -4.606201171875, -4.4324951171875, -4.2587890625, -4.0850830078125, -3.911376953125, -3.7376708984375, -3.56396484375, -3.3902587890625, -3.216552734375, -3.0428466796875, -2.869140625, -2.6954345703125, -2.521728515625, -2.3480224609375, -2.17431640625, -2.0006103515625, -1.826904296875, -1.6531982421875, -1.4794921875, -1.3057861328125, -1.132080078125, -0.9583740234375, -0.78466796875, -0.6109619140625, -0.437255859375, -0.2635498046875, -0.08984375, 0.0838623046875, 0.257568359375, 0.4312744140625, 0.60498046875, 0.7786865234375, 0.952392578125, 1.1260986328125, 1.2998046875, 1.4735107421875, 1.647216796875, 1.8209228515625, 1.99462890625, 2.1683349609375, 2.342041015625, 2.5157470703125, 2.689453125, 2.8631591796875, 3.036865234375, 3.2105712890625, 3.38427734375, 3.5579833984375, 3.731689453125, 3.9053955078125, 4.0791015625, 4.2528076171875, 4.426513671875, 4.6002197265625, 4.77392578125, 4.9476318359375, 5.121337890625, 5.2950439453125, 5.46875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 13.0, 5.0, 15.0, 28.0, 43.0, 73.0, 94.0, 169.0, 251.0, 376.0, 583.0, 857.0, 1381.0, 2198.0, 3439.0, 5049.0, 7791.0, 11650.0, 17835.0, 27090.0, 41204.0, 62391.0, 93849.0, 135115.0, 1214260.0, 150141.0, 108094.0, 72697.0, 47992.0, 31768.0, 20714.0, 14028.0, 8940.0, 6004.0, 3867.0, 2552.0, 1646.0, 1016.0, 721.0, 411.0, 277.0, 196.0, 122.0, 78.0, 43.0, 25.0, 14.0, 13.0, 3.0, 9.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.56591796875, -0.5491180419921875, -0.532318115234375, -0.5155181884765625, -0.49871826171875, -0.4819183349609375, -0.465118408203125, -0.4483184814453125, -0.4315185546875, -0.4147186279296875, -0.397918701171875, -0.3811187744140625, -0.36431884765625, -0.3475189208984375, -0.330718994140625, -0.3139190673828125, -0.297119140625, -0.2803192138671875, -0.263519287109375, -0.2467193603515625, -0.22991943359375, -0.2131195068359375, -0.196319580078125, -0.1795196533203125, -0.1627197265625, -0.1459197998046875, -0.129119873046875, -0.1123199462890625, -0.09552001953125, -0.0787200927734375, -0.061920166015625, -0.0451202392578125, -0.0283203125, -0.0115203857421875, 0.005279541015625, 0.0220794677734375, 0.03887939453125, 0.0556793212890625, 0.072479248046875, 0.0892791748046875, 0.1060791015625, 0.1228790283203125, 0.139678955078125, 0.1564788818359375, 0.17327880859375, 0.1900787353515625, 0.206878662109375, 0.2236785888671875, 0.240478515625, 0.2572784423828125, 0.274078369140625, 0.2908782958984375, 0.30767822265625, 0.3244781494140625, 0.341278076171875, 0.3580780029296875, 0.3748779296875, 0.3916778564453125, 0.408477783203125, 0.4252777099609375, 0.44207763671875, 0.4588775634765625, 0.475677490234375, 0.4924774169921875, 0.50927734375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 3.0, 9.0, 17.0, 14.0, 24.0, 27.0, 36.0, 41.0, 49.0, 62.0, 65.0, 74.0, 73.0, 69.0, 67.0, 65.0, 65.0, 49.0, 40.0, 31.0, 25.0, 13.0, 19.0, 11.0, 8.0, 7.0, 6.0, 7.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025463104248046875, -0.0024728775024414062, -0.002399444580078125, -0.0023260116577148438, -0.0022525787353515625, -0.0021791458129882812, -0.002105712890625, -0.0020322799682617188, -0.0019588470458984375, -0.0018854141235351562, -0.001811981201171875, -0.0017385482788085938, -0.0016651153564453125, -0.0015916824340820312, -0.00151824951171875, -0.0014448165893554688, -0.0013713836669921875, -0.0012979507446289062, -0.001224517822265625, -0.0011510848999023438, -0.0010776519775390625, -0.0010042190551757812, -0.0009307861328125, -0.0008573532104492188, -0.0007839202880859375, -0.0007104873657226562, -0.000637054443359375, -0.0005636215209960938, -0.0004901885986328125, -0.00041675567626953125, -0.00034332275390625, -0.00026988983154296875, -0.0001964569091796875, -0.00012302398681640625, -4.9591064453125e-05, 2.384185791015625e-05, 9.72747802734375e-05, 0.00017070770263671875, 0.000244140625, 0.00031757354736328125, 0.0003910064697265625, 0.00046443939208984375, 0.000537872314453125, 0.0006113052368164062, 0.0006847381591796875, 0.0007581710815429688, 0.00083160400390625, 0.0009050369262695312, 0.0009784698486328125, 0.0010519027709960938, 0.001125335693359375, 0.0011987686157226562, 0.0012722015380859375, 0.0013456344604492188, 0.0014190673828125, 0.0014925003051757812, 0.0015659332275390625, 0.0016393661499023438, 0.001712799072265625, 0.0017862319946289062, 0.0018596649169921875, 0.0019330978393554688, 0.00200653076171875, 0.0020799636840820312, 0.0021533966064453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 12.0, 15.0, 14.0, 16.0, 21.0, 42.0, 37.0, 55.0, 74.0, 123.0, 153.0, 325.0, 527.0, 1259.0, 524889.0, 518363.0, 1244.0, 527.0, 276.0, 156.0, 120.0, 84.0, 55.0, 41.0, 34.0, 17.0, 14.0, 13.0, 12.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.042083740234375, -0.040680885314941406, -0.03927803039550781, -0.03787517547607422, -0.036472320556640625, -0.03506946563720703, -0.03366661071777344, -0.032263755798339844, -0.03086090087890625, -0.029458045959472656, -0.028055191040039062, -0.02665233612060547, -0.025249481201171875, -0.02384662628173828, -0.022443771362304688, -0.021040916442871094, -0.0196380615234375, -0.018235206604003906, -0.016832351684570312, -0.015429496765136719, -0.014026641845703125, -0.012623786926269531, -0.011220932006835938, -0.009818077087402344, -0.00841522216796875, -0.007012367248535156, -0.0056095123291015625, -0.004206657409667969, -0.002803802490234375, -0.0014009475708007812, 1.9073486328125e-06, 0.0014047622680664062, 0.0028076171875, 0.004210472106933594, 0.0056133270263671875, 0.007016181945800781, 0.008419036865234375, 0.009821891784667969, 0.011224746704101562, 0.012627601623535156, 0.01403045654296875, 0.015433311462402344, 0.016836166381835938, 0.01823902130126953, 0.019641876220703125, 0.02104473114013672, 0.022447586059570312, 0.023850440979003906, 0.0252532958984375, 0.026656150817871094, 0.028059005737304688, 0.02946186065673828, 0.030864715576171875, 0.03226757049560547, 0.03367042541503906, 0.035073280334472656, 0.03647613525390625, 0.037878990173339844, 0.03928184509277344, 0.04068470001220703, 0.042087554931640625, 0.04349040985107422, 0.04489326477050781, 0.046296119689941406, 0.047698974609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 19.0, 523.0, 454.0, 20.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012449084781110287, -0.012172176502645016, -0.01189526915550232, -0.011618360877037048, -0.011341452598571777, -0.011064544320106506, -0.01078763697296381, -0.010510728694498539, -0.010233820416033268, -0.009956912137567997, -0.0096800047904253, -0.00940309651196003, -0.009126188233494759, -0.008849279955029488, -0.008572372607886791, -0.00829546432942152, -0.008018556982278824, -0.00774164916947484, -0.007464740891009569, -0.0071878330782055855, -0.0069109247997403145, -0.006634016986936331, -0.006357109174132347, -0.006080200895667076, -0.005803292617201805, -0.005526384804397821, -0.00524947652593255, -0.004972568713128567, -0.004695660434663296, -0.004418752621859312, -0.004141844809055328, -0.0038649365305900574, -0.0035880282521247864, -0.003311120206490159, -0.0030342121608555317, -0.002757304348051548, -0.002480396069586277, -0.0022034882567822933, -0.001926580211147666, -0.0016496721655130386, -0.0013727641198784113, -0.001095856074243784, -0.0008189480868168175, -0.0005420400993898511, -0.00026513205375522375, 1.1775991879403591e-05, 0.0002886839210987091, 0.0005655919667333364, 0.0008425000123679638, 0.0011194080580025911, 0.0013963161036372185, 0.001673224032856524, 0.0019501320784911513, 0.002227040007710457, 0.002503948053345084, 0.0027808560989797115, 0.003057764144614339, 0.0033346721902489662, 0.0036115802358835936, 0.003888488281518221, 0.004165396094322205, 0.004442304372787476, 0.004719212185591459, 0.004996119998395443, 0.005273028276860714]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 3.0, 7.0, 5.0, 19.0, 14.0, 17.0, 15.0, 21.0, 24.0, 21.0, 28.0, 27.0, 32.0, 33.0, 38.0, 40.0, 47.0, 33.0, 48.0, 38.0, 29.0, 47.0, 37.0, 27.0, 36.0, 30.0, 39.0, 29.0, 23.0, 23.0, 22.0, 21.0, 23.0, 20.0, 13.0, 9.0, 10.0, 8.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008704066276550293, -0.0008399803191423416, -0.0008095540106296539, -0.0007791277021169662, -0.0007487013936042786, -0.0007182750850915909, -0.0006878487765789032, -0.0006574224680662155, -0.0006269961595535278, -0.0005965698510408401, -0.0005661435425281525, -0.0005357172340154648, -0.0005052909255027771, -0.0004748646169900894, -0.00044443830847740173, -0.00041401199996471405, -0.00038358569145202637, -0.0003531593829393387, -0.000322733074426651, -0.0002923067659139633, -0.00026188045740127563, -0.00023145414888858795, -0.00020102784037590027, -0.00017060153186321259, -0.0001401752233505249, -0.00010974891483783722, -7.932260632514954e-05, -4.889629781246185e-05, -1.846998929977417e-05, 1.1956319212913513e-05, 4.2382627725601196e-05, 7.280893623828888e-05, 0.00010323524475097656, 0.00013366155326366425, 0.00016408786177635193, 0.0001945141702890396, 0.0002249404788017273, 0.000255366787314415, 0.00028579309582710266, 0.00031621940433979034, 0.00034664571285247803, 0.0003770720213651657, 0.0004074983298778534, 0.0004379246383905411, 0.00046835094690322876, 0.0004987772554159164, 0.0005292035639286041, 0.0005596298724412918, 0.0005900561809539795, 0.0006204824894666672, 0.0006509087979793549, 0.0006813351064920425, 0.0007117614150047302, 0.0007421877235174179, 0.0007726140320301056, 0.0008030403405427933, 0.000833466649055481, 0.0008638929575681686, 0.0008943192660808563, 0.000924745574593544, 0.0009551718831062317, 0.0009855981916189194, 0.001016024500131607, 0.0010464508086442947, 0.0010768771171569824]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 11.0, 5.0, 11.0, 7.0, 8.0, 10.0, 20.0, 14.0, 17.0, 15.0, 21.0, 15.0, 33.0, 28.0, 32.0, 31.0, 40.0, 31.0, 34.0, 41.0, 34.0, 43.0, 56.0, 32.0, 51.0, 38.0, 32.0, 39.0, 37.0, 24.0, 24.0, 21.0, 19.0, 18.0, 21.0, 16.0, 13.0, 7.0, 9.0, 4.0, 11.0, 11.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.9569091796875, -7.695068359375, -7.4332275390625, -7.17138671875, -6.9095458984375, -6.647705078125, -6.3858642578125, -6.1240234375, -5.8621826171875, -5.600341796875, -5.3385009765625, -5.07666015625, -4.8148193359375, -4.552978515625, -4.2911376953125, -4.029296875, -3.7674560546875, -3.505615234375, -3.2437744140625, -2.98193359375, -2.7200927734375, -2.458251953125, -2.1964111328125, -1.9345703125, -1.6727294921875, -1.410888671875, -1.1490478515625, -0.88720703125, -0.6253662109375, -0.363525390625, -0.1016845703125, 0.16015625, 0.4219970703125, 0.683837890625, 0.9456787109375, 1.20751953125, 1.4693603515625, 1.731201171875, 1.9930419921875, 2.2548828125, 2.5167236328125, 2.778564453125, 3.0404052734375, 3.30224609375, 3.5640869140625, 3.825927734375, 4.0877685546875, 4.349609375, 4.6114501953125, 4.873291015625, 5.1351318359375, 5.39697265625, 5.6588134765625, 5.920654296875, 6.1824951171875, 6.4443359375, 6.7061767578125, 6.968017578125, 7.2298583984375, 7.49169921875, 7.7535400390625, 8.015380859375, 8.2772216796875, 8.5390625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 3.0, 3.0, 3.0, 9.0, 13.0, 22.0, 17.0, 21.0, 30.0, 39.0, 53.0, 78.0, 99.0, 114.0, 156.0, 219.0, 374.0, 556.0, 1022.0, 1895.0, 3654.0, 8033.0, 18170.0, 44583.0, 110293.0, 289500.0, 342203.0, 133107.0, 53510.0, 22070.0, 9090.0, 4304.0, 2187.0, 1121.0, 662.0, 370.0, 256.0, 187.0, 139.0, 115.0, 63.0, 50.0, 45.0, 40.0, 23.0, 16.0, 12.0, 9.0, 13.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2734375, -9.943115234375, -9.61279296875, -9.282470703125, -8.9521484375, -8.621826171875, -8.29150390625, -7.961181640625, -7.630859375, -7.300537109375, -6.97021484375, -6.639892578125, -6.3095703125, -5.979248046875, -5.64892578125, -5.318603515625, -4.98828125, -4.657958984375, -4.32763671875, -3.997314453125, -3.6669921875, -3.336669921875, -3.00634765625, -2.676025390625, -2.345703125, -2.015380859375, -1.68505859375, -1.354736328125, -1.0244140625, -0.694091796875, -0.36376953125, -0.033447265625, 0.296875, 0.627197265625, 0.95751953125, 1.287841796875, 1.6181640625, 1.948486328125, 2.27880859375, 2.609130859375, 2.939453125, 3.269775390625, 3.60009765625, 3.930419921875, 4.2607421875, 4.591064453125, 4.92138671875, 5.251708984375, 5.58203125, 5.912353515625, 6.24267578125, 6.572998046875, 6.9033203125, 7.233642578125, 7.56396484375, 7.894287109375, 8.224609375, 8.554931640625, 8.88525390625, 9.215576171875, 9.5458984375, 9.876220703125, 10.20654296875, 10.536865234375, 10.8671875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 3.0, 6.0, 8.0, 7.0, 9.0, 12.0, 11.0, 8.0, 19.0, 11.0, 25.0, 29.0, 37.0, 30.0, 40.0, 40.0, 64.0, 80.0, 112.0, 181.0, 1427.0, 252.0, 126.0, 87.0, 56.0, 38.0, 55.0, 32.0, 27.0, 20.0, 33.0, 19.0, 21.0, 20.0, 21.0, 19.0, 6.0, 10.0, 4.0, 11.0, 2.0, 6.0, 3.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.703125, -22.931640625, -22.16015625, -21.388671875, -20.6171875, -19.845703125, -19.07421875, -18.302734375, -17.53125, -16.759765625, -15.98828125, -15.216796875, -14.4453125, -13.673828125, -12.90234375, -12.130859375, -11.359375, -10.587890625, -9.81640625, -9.044921875, -8.2734375, -7.501953125, -6.73046875, -5.958984375, -5.1875, -4.416015625, -3.64453125, -2.873046875, -2.1015625, -1.330078125, -0.55859375, 0.212890625, 0.984375, 1.755859375, 2.52734375, 3.298828125, 4.0703125, 4.841796875, 5.61328125, 6.384765625, 7.15625, 7.927734375, 8.69921875, 9.470703125, 10.2421875, 11.013671875, 11.78515625, 12.556640625, 13.328125, 14.099609375, 14.87109375, 15.642578125, 16.4140625, 17.185546875, 17.95703125, 18.728515625, 19.5, 20.271484375, 21.04296875, 21.814453125, 22.5859375, 23.357421875, 24.12890625, 24.900390625, 25.671875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 9.0, 7.0, 13.0, 11.0, 20.0, 19.0, 28.0, 41.0, 62.0, 75.0, 141.0, 195.0, 308.0, 482.0, 1052.0, 7838.0, 466865.0, 2641512.0, 23829.0, 1635.0, 537.0, 333.0, 208.0, 127.0, 100.0, 67.0, 47.0, 39.0, 29.0, 15.0, 9.0, 13.0, 8.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-60.59375, -58.81982421875, -57.0458984375, -55.27197265625, -53.498046875, -51.72412109375, -49.9501953125, -48.17626953125, -46.40234375, -44.62841796875, -42.8544921875, -41.08056640625, -39.306640625, -37.53271484375, -35.7587890625, -33.98486328125, -32.2109375, -30.43701171875, -28.6630859375, -26.88916015625, -25.115234375, -23.34130859375, -21.5673828125, -19.79345703125, -18.01953125, -16.24560546875, -14.4716796875, -12.69775390625, -10.923828125, -9.14990234375, -7.3759765625, -5.60205078125, -3.828125, -2.05419921875, -0.2802734375, 1.49365234375, 3.267578125, 5.04150390625, 6.8154296875, 8.58935546875, 10.36328125, 12.13720703125, 13.9111328125, 15.68505859375, 17.458984375, 19.23291015625, 21.0068359375, 22.78076171875, 24.5546875, 26.32861328125, 28.1025390625, 29.87646484375, 31.650390625, 33.42431640625, 35.1982421875, 36.97216796875, 38.74609375, 40.52001953125, 42.2939453125, 44.06787109375, 45.841796875, 47.61572265625, 49.3896484375, 51.16357421875, 52.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [20.0, 179.0, 452.0, 308.0, 48.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.707290649414062, -8.592103958129883, -3.476917266845703, 1.6382694244384766, 6.753456115722656, 11.868642807006836, 16.983829498291016, 22.099014282226562, 27.214202880859375, 32.32939147949219, 37.444576263427734, 42.55976104736328, 47.674949645996094, 52.790138244628906, 57.90532302856445, 63.0205078125, 68.13569641113281, 73.25088500976562, 78.36607360839844, 83.48125457763672, 88.59644317626953, 93.71163177490234, 98.82681274414062, 103.94200134277344, 109.05718994140625, 114.17237854003906, 119.28756713867188, 124.40274810791016, 129.5179443359375, 134.63311767578125, 139.74830627441406, 144.86349487304688, 149.97869873046875, 155.09388732910156, 160.20907592773438, 165.3242645263672, 170.439453125, 175.55462646484375, 180.66981506347656, 185.78500366210938, 190.9001922607422, 196.015380859375, 201.1305694580078, 206.24575805664062, 211.36093139648438, 216.4761199951172, 221.59130859375, 226.7064971923828, 231.82168579101562, 236.93687438964844, 242.05206298828125, 247.16725158691406, 252.28244018554688, 257.3976135253906, 262.5128173828125, 267.62799072265625, 272.7431640625, 277.85833740234375, 282.9735412597656, 288.0887145996094, 293.20391845703125, 298.319091796875, 303.4342956542969, 308.5494689941406, 313.6646728515625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 8.0, 9.0, 5.0, 8.0, 19.0, 12.0, 26.0, 11.0, 19.0, 24.0, 20.0, 38.0, 24.0, 24.0, 32.0, 37.0, 39.0, 44.0, 56.0, 35.0, 39.0, 39.0, 54.0, 42.0, 40.0, 35.0, 30.0, 36.0, 28.0, 34.0, 18.0, 20.0, 15.0, 10.0, 9.0, 13.0, 13.0, 13.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.21308135986328, -58.29692459106445, -56.380767822265625, -54.46461486816406, -52.548458099365234, -50.632301330566406, -48.71614456176758, -46.79998779296875, -44.88383483886719, -42.96767807006836, -41.05152130126953, -39.13536834716797, -37.21921157836914, -35.30305480957031, -33.386898040771484, -31.47074317932129, -29.55458641052246, -27.638429641723633, -25.722274780273438, -23.80611801147461, -21.889963150024414, -19.973806381225586, -18.05765151977539, -16.141494750976562, -14.22533893585205, -12.309183120727539, -10.393027305603027, -8.476871490478516, -6.560715198516846, -4.644558906555176, -2.728403091430664, -0.8122472763061523, 1.1039085388183594, 3.020064353942871, 4.936220169067383, 6.852376461029053, 8.768531799316406, 10.684688568115234, 12.600844383239746, 14.517000198364258, 16.433155059814453, 18.34931182861328, 20.265466690063477, 22.181623458862305, 24.0977783203125, 26.013935089111328, 27.930091857910156, 29.84624671936035, 31.76240348815918, 33.678558349609375, 35.5947151184082, 37.51087188720703, 39.42702865600586, 41.34318542480469, 43.25933837890625, 45.17549514770508, 47.091651916503906, 49.007808685302734, 50.92396545410156, 52.840118408203125, 54.75627517700195, 56.67243194580078, 58.58858871459961, 60.50474548339844, 62.4208984375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 1.0, 9.0, 4.0, 5.0, 9.0, 16.0, 9.0, 10.0, 27.0, 14.0, 18.0, 27.0, 25.0, 23.0, 29.0, 37.0, 33.0, 41.0, 51.0, 32.0, 48.0, 43.0, 41.0, 31.0, 52.0, 47.0, 23.0, 38.0, 42.0, 31.0, 24.0, 35.0, 21.0, 18.0, 18.0, 10.0, 6.0, 12.0, 10.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.3828125, -10.0902099609375, -9.797607421875, -9.5050048828125, -9.21240234375, -8.9197998046875, -8.627197265625, -8.3345947265625, -8.0419921875, -7.7493896484375, -7.456787109375, -7.1641845703125, -6.87158203125, -6.5789794921875, -6.286376953125, -5.9937744140625, -5.701171875, -5.4085693359375, -5.115966796875, -4.8233642578125, -4.53076171875, -4.2381591796875, -3.945556640625, -3.6529541015625, -3.3603515625, -3.0677490234375, -2.775146484375, -2.4825439453125, -2.18994140625, -1.8973388671875, -1.604736328125, -1.3121337890625, -1.01953125, -0.7269287109375, -0.434326171875, -0.1417236328125, 0.15087890625, 0.4434814453125, 0.736083984375, 1.0286865234375, 1.3212890625, 1.6138916015625, 1.906494140625, 2.1990966796875, 2.49169921875, 2.7843017578125, 3.076904296875, 3.3695068359375, 3.662109375, 3.9547119140625, 4.247314453125, 4.5399169921875, 4.83251953125, 5.1251220703125, 5.417724609375, 5.7103271484375, 6.0029296875, 6.2955322265625, 6.588134765625, 6.8807373046875, 7.17333984375, 7.4659423828125, 7.758544921875, 8.0511474609375, 8.34375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 9.0, 11.0, 16.0, 13.0, 25.0, 39.0, 54.0, 74.0, 95.0, 136.0, 222.0, 374.0, 714.0, 1530.0, 3854.0, 11812.0, 43088.0, 177190.0, 656773.0, 1511787.0, 1213300.0, 424470.0, 108388.0, 27026.0, 7782.0, 2793.0, 1123.0, 613.0, 331.0, 168.0, 145.0, 102.0, 51.0, 35.0, 36.0, 23.0, 16.0, 12.0, 14.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1497802734375, -9.830810546875, -9.5118408203125, -9.19287109375, -8.8739013671875, -8.554931640625, -8.2359619140625, -7.9169921875, -7.5980224609375, -7.279052734375, -6.9600830078125, -6.64111328125, -6.3221435546875, -6.003173828125, -5.6842041015625, -5.365234375, -5.0462646484375, -4.727294921875, -4.4083251953125, -4.08935546875, -3.7703857421875, -3.451416015625, -3.1324462890625, -2.8134765625, -2.4945068359375, -2.175537109375, -1.8565673828125, -1.53759765625, -1.2186279296875, -0.899658203125, -0.5806884765625, -0.26171875, 0.0572509765625, 0.376220703125, 0.6951904296875, 1.01416015625, 1.3331298828125, 1.652099609375, 1.9710693359375, 2.2900390625, 2.6090087890625, 2.927978515625, 3.2469482421875, 3.56591796875, 3.8848876953125, 4.203857421875, 4.5228271484375, 4.841796875, 5.1607666015625, 5.479736328125, 5.7987060546875, 6.11767578125, 6.4366455078125, 6.755615234375, 7.0745849609375, 7.3935546875, 7.7125244140625, 8.031494140625, 8.3504638671875, 8.66943359375, 8.9884033203125, 9.307373046875, 9.6263427734375, 9.9453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 10.0, 7.0, 15.0, 9.0, 25.0, 19.0, 42.0, 47.0, 77.0, 101.0, 144.0, 225.0, 290.0, 424.0, 479.0, 526.0, 415.0, 357.0, 245.0, 194.0, 127.0, 93.0, 54.0, 37.0, 27.0, 28.0, 15.0, 13.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.0859375, -13.64892578125, -13.2119140625, -12.77490234375, -12.337890625, -11.90087890625, -11.4638671875, -11.02685546875, -10.58984375, -10.15283203125, -9.7158203125, -9.27880859375, -8.841796875, -8.40478515625, -7.9677734375, -7.53076171875, -7.09375, -6.65673828125, -6.2197265625, -5.78271484375, -5.345703125, -4.90869140625, -4.4716796875, -4.03466796875, -3.59765625, -3.16064453125, -2.7236328125, -2.28662109375, -1.849609375, -1.41259765625, -0.9755859375, -0.53857421875, -0.1015625, 0.33544921875, 0.7724609375, 1.20947265625, 1.646484375, 2.08349609375, 2.5205078125, 2.95751953125, 3.39453125, 3.83154296875, 4.2685546875, 4.70556640625, 5.142578125, 5.57958984375, 6.0166015625, 6.45361328125, 6.890625, 7.32763671875, 7.7646484375, 8.20166015625, 8.638671875, 9.07568359375, 9.5126953125, 9.94970703125, 10.38671875, 10.82373046875, 11.2607421875, 11.69775390625, 12.134765625, 12.57177734375, 13.0087890625, 13.44580078125, 13.8828125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 8.0, 7.0, 10.0, 15.0, 31.0, 32.0, 42.0, 70.0, 78.0, 190.0, 253.0, 537.0, 1065.0, 2531.0, 7641.0, 27919.0, 148319.0, 1215655.0, 2372509.0, 344528.0, 53578.0, 12392.0, 3777.0, 1461.0, 663.0, 344.0, 206.0, 122.0, 79.0, 64.0, 40.0, 27.0, 28.0, 14.0, 6.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.21875, -17.635009765625, -17.05126953125, -16.467529296875, -15.8837890625, -15.300048828125, -14.71630859375, -14.132568359375, -13.548828125, -12.965087890625, -12.38134765625, -11.797607421875, -11.2138671875, -10.630126953125, -10.04638671875, -9.462646484375, -8.87890625, -8.295166015625, -7.71142578125, -7.127685546875, -6.5439453125, -5.960205078125, -5.37646484375, -4.792724609375, -4.208984375, -3.625244140625, -3.04150390625, -2.457763671875, -1.8740234375, -1.290283203125, -0.70654296875, -0.122802734375, 0.4609375, 1.044677734375, 1.62841796875, 2.212158203125, 2.7958984375, 3.379638671875, 3.96337890625, 4.547119140625, 5.130859375, 5.714599609375, 6.29833984375, 6.882080078125, 7.4658203125, 8.049560546875, 8.63330078125, 9.217041015625, 9.80078125, 10.384521484375, 10.96826171875, 11.552001953125, 12.1357421875, 12.719482421875, 13.30322265625, 13.886962890625, 14.470703125, 15.054443359375, 15.63818359375, 16.221923828125, 16.8056640625, 17.389404296875, 17.97314453125, 18.556884765625, 19.140625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 32.0, 386.0, 547.0, 49.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.45945739746094, -203.35934448242188, -193.2592315673828, -183.15911865234375, -173.0590057373047, -162.95889282226562, -152.85877990722656, -142.7586669921875, -132.65855407714844, -122.55844116210938, -112.45832824707031, -102.35821533203125, -92.25810241699219, -82.15798950195312, -72.05787658691406, -61.957763671875, -51.85765075683594, -41.757537841796875, -31.657424926757812, -21.55731201171875, -11.457199096679688, -1.357086181640625, 8.743026733398438, 18.8431396484375, 28.943252563476562, 39.043365478515625, 49.14347839355469, 59.24359130859375, 69.34370422363281, 79.44381713867188, 89.54393005371094, 99.64404296875, 109.744140625, 119.84425354003906, 129.94436645507812, 140.0444793701172, 150.14459228515625, 160.2447052001953, 170.34481811523438, 180.44493103027344, 190.5450439453125, 200.64515686035156, 210.74526977539062, 220.8453826904297, 230.94549560546875, 241.0456085205078, 251.14572143554688, 261.245849609375, 271.345947265625, 281.446044921875, 291.5461730957031, 301.64630126953125, 311.74639892578125, 321.84649658203125, 331.9466247558594, 342.0467529296875, 352.1468505859375, 362.2469482421875, 372.3470764160156, 382.44720458984375, 392.54730224609375, 402.64739990234375, 412.7475280761719, 422.84765625, 432.94775390625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 11.0, 11.0, 12.0, 8.0, 20.0, 14.0, 25.0, 20.0, 27.0, 28.0, 27.0, 31.0, 40.0, 37.0, 46.0, 48.0, 51.0, 38.0, 54.0, 44.0, 46.0, 40.0, 35.0, 29.0, 31.0, 30.0, 26.0, 34.0, 24.0, 21.0, 9.0, 16.0, 11.0, 2.0, 10.0, 4.0, 3.0, 6.0, 3.0, 4.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.23390579223633, -41.83201217651367, -40.43012237548828, -39.028228759765625, -37.626338958740234, -36.22444534301758, -34.82255554199219, -33.42066192626953, -32.018768310546875, -30.61687660217285, -29.214984893798828, -27.813091278076172, -26.41119956970215, -25.009307861328125, -23.6074161529541, -22.205524444580078, -20.803632736206055, -19.40174102783203, -17.999849319458008, -16.597957611083984, -15.196063995361328, -13.794172286987305, -12.392280578613281, -10.990387916564941, -9.588496208190918, -8.186604499816895, -6.784711837768555, -5.382820129394531, -3.9809279441833496, -2.579035758972168, -1.1771440505981445, 0.2247486114501953, 1.6266403198242188, 3.0285325050354004, 4.430424690246582, 5.8323163986206055, 7.234208583831787, 8.636100769042969, 10.037992477416992, 11.439885139465332, 12.841776847839355, 14.243668556213379, 15.645561218261719, 17.047452926635742, 18.449344635009766, 19.851238250732422, 21.253128051757812, 22.65502166748047, 24.056913375854492, 25.458805084228516, 26.86069679260254, 28.262588500976562, 29.66448211669922, 31.066373825073242, 32.468265533447266, 33.87015914916992, 35.27204895019531, 36.67394256591797, 38.07583236694336, 39.477725982666016, 40.879615783691406, 42.28150939941406, 43.68340301513672, 45.08529281616211, 46.487186431884766]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 6.0, 5.0, 4.0, 8.0, 8.0, 7.0, 15.0, 19.0, 17.0, 18.0, 19.0, 25.0, 26.0, 28.0, 42.0, 35.0, 35.0, 33.0, 40.0, 34.0, 35.0, 43.0, 47.0, 39.0, 50.0, 35.0, 34.0, 35.0, 38.0, 27.0, 28.0, 37.0, 25.0, 23.0, 10.0, 12.0, 9.0, 7.0, 2.0, 8.0, 6.0, 10.0, 4.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.5234375, -9.239501953125, -8.95556640625, -8.671630859375, -8.3876953125, -8.103759765625, -7.81982421875, -7.535888671875, -7.251953125, -6.968017578125, -6.68408203125, -6.400146484375, -6.1162109375, -5.832275390625, -5.54833984375, -5.264404296875, -4.98046875, -4.696533203125, -4.41259765625, -4.128662109375, -3.8447265625, -3.560791015625, -3.27685546875, -2.992919921875, -2.708984375, -2.425048828125, -2.14111328125, -1.857177734375, -1.5732421875, -1.289306640625, -1.00537109375, -0.721435546875, -0.4375, -0.153564453125, 0.13037109375, 0.414306640625, 0.6982421875, 0.982177734375, 1.26611328125, 1.550048828125, 1.833984375, 2.117919921875, 2.40185546875, 2.685791015625, 2.9697265625, 3.253662109375, 3.53759765625, 3.821533203125, 4.10546875, 4.389404296875, 4.67333984375, 4.957275390625, 5.2412109375, 5.525146484375, 5.80908203125, 6.093017578125, 6.376953125, 6.660888671875, 6.94482421875, 7.228759765625, 7.5126953125, 7.796630859375, 8.08056640625, 8.364501953125, 8.6484375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 5.0, 16.0, 13.0, 19.0, 41.0, 36.0, 61.0, 94.0, 170.0, 240.0, 444.0, 674.0, 1132.0, 1815.0, 2968.0, 4890.0, 8190.0, 13206.0, 22279.0, 37130.0, 63880.0, 109407.0, 185858.0, 230015.0, 150827.0, 87976.0, 51386.0, 29993.0, 18043.0, 10741.0, 6587.0, 3971.0, 2476.0, 1501.0, 935.0, 522.0, 378.0, 237.0, 139.0, 102.0, 59.0, 39.0, 21.0, 19.0, 14.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8525390625, -0.826934814453125, -0.80133056640625, -0.775726318359375, -0.7501220703125, -0.724517822265625, -0.69891357421875, -0.673309326171875, -0.647705078125, -0.622100830078125, -0.59649658203125, -0.570892333984375, -0.5452880859375, -0.519683837890625, -0.49407958984375, -0.468475341796875, -0.44287109375, -0.417266845703125, -0.39166259765625, -0.366058349609375, -0.3404541015625, -0.314849853515625, -0.28924560546875, -0.263641357421875, -0.238037109375, -0.212432861328125, -0.18682861328125, -0.161224365234375, -0.1356201171875, -0.110015869140625, -0.08441162109375, -0.058807373046875, -0.033203125, -0.007598876953125, 0.01800537109375, 0.043609619140625, 0.0692138671875, 0.094818115234375, 0.12042236328125, 0.146026611328125, 0.171630859375, 0.197235107421875, 0.22283935546875, 0.248443603515625, 0.2740478515625, 0.299652099609375, 0.32525634765625, 0.350860595703125, 0.37646484375, 0.402069091796875, 0.42767333984375, 0.453277587890625, 0.4788818359375, 0.504486083984375, 0.53009033203125, 0.555694580078125, 0.581298828125, 0.606903076171875, 0.63250732421875, 0.658111572265625, 0.6837158203125, 0.709320068359375, 0.73492431640625, 0.760528564453125, 0.7861328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 14.0, 7.0, 12.0, 17.0, 28.0, 15.0, 23.0, 26.0, 34.0, 26.0, 44.0, 46.0, 35.0, 31.0, 54.0, 45.0, 1078.0, 46.0, 53.0, 35.0, 40.0, 37.0, 27.0, 35.0, 41.0, 22.0, 28.0, 19.0, 18.0, 20.0, 13.0, 12.0, 3.0, 10.0, 2.0, 5.0, 6.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.669189453125, -5.47509765625, -5.281005859375, -5.0869140625, -4.892822265625, -4.69873046875, -4.504638671875, -4.310546875, -4.116455078125, -3.92236328125, -3.728271484375, -3.5341796875, -3.340087890625, -3.14599609375, -2.951904296875, -2.7578125, -2.563720703125, -2.36962890625, -2.175537109375, -1.9814453125, -1.787353515625, -1.59326171875, -1.399169921875, -1.205078125, -1.010986328125, -0.81689453125, -0.622802734375, -0.4287109375, -0.234619140625, -0.04052734375, 0.153564453125, 0.34765625, 0.541748046875, 0.73583984375, 0.929931640625, 1.1240234375, 1.318115234375, 1.51220703125, 1.706298828125, 1.900390625, 2.094482421875, 2.28857421875, 2.482666015625, 2.6767578125, 2.870849609375, 3.06494140625, 3.259033203125, 3.453125, 3.647216796875, 3.84130859375, 4.035400390625, 4.2294921875, 4.423583984375, 4.61767578125, 4.811767578125, 5.005859375, 5.199951171875, 5.39404296875, 5.588134765625, 5.7822265625, 5.976318359375, 6.17041015625, 6.364501953125, 6.55859375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 13.0, 18.0, 21.0, 41.0, 48.0, 84.0, 136.0, 174.0, 285.0, 429.0, 678.0, 1089.0, 1652.0, 2451.0, 3846.0, 5847.0, 9031.0, 13935.0, 21447.0, 33371.0, 50735.0, 78891.0, 121607.0, 281174.0, 1114926.0, 124755.0, 81000.0, 52282.0, 34108.0, 22327.0, 14111.0, 9252.0, 6098.0, 3881.0, 2557.0, 1657.0, 1127.0, 666.0, 476.0, 300.0, 230.0, 128.0, 84.0, 60.0, 37.0, 25.0, 17.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.57177734375, -0.5533523559570312, -0.5349273681640625, -0.5165023803710938, -0.498077392578125, -0.47965240478515625, -0.4612274169921875, -0.44280242919921875, -0.42437744140625, -0.40595245361328125, -0.3875274658203125, -0.36910247802734375, -0.350677490234375, -0.33225250244140625, -0.3138275146484375, -0.29540252685546875, -0.2769775390625, -0.25855255126953125, -0.2401275634765625, -0.22170257568359375, -0.203277587890625, -0.18485260009765625, -0.1664276123046875, -0.14800262451171875, -0.12957763671875, -0.11115264892578125, -0.0927276611328125, -0.07430267333984375, -0.055877685546875, -0.03745269775390625, -0.0190277099609375, -0.00060272216796875, 0.017822265625, 0.03624725341796875, 0.0546722412109375, 0.07309722900390625, 0.091522216796875, 0.10994720458984375, 0.1283721923828125, 0.14679718017578125, 0.16522216796875, 0.18364715576171875, 0.2020721435546875, 0.22049713134765625, 0.238922119140625, 0.25734710693359375, 0.2757720947265625, 0.29419708251953125, 0.3126220703125, 0.33104705810546875, 0.3494720458984375, 0.36789703369140625, 0.386322021484375, 0.40474700927734375, 0.4231719970703125, 0.44159698486328125, 0.46002197265625, 0.47844696044921875, 0.4968719482421875, 0.5152969360351562, 0.533721923828125, 0.5521469116210938, 0.5705718994140625, 0.5889968872070312, 0.607421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 5.0, 9.0, 12.0, 15.0, 19.0, 22.0, 30.0, 21.0, 41.0, 39.0, 52.0, 55.0, 48.0, 52.0, 63.0, 68.0, 57.0, 47.0, 48.0, 37.0, 56.0, 47.0, 37.0, 28.0, 17.0, 25.0, 17.0, 9.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002513885498046875, -0.0024206936359405518, -0.0023275017738342285, -0.0022343099117279053, -0.002141118049621582, -0.002047926187515259, -0.0019547343254089355, -0.0018615424633026123, -0.001768350601196289, -0.0016751587390899658, -0.0015819668769836426, -0.0014887750148773193, -0.001395583152770996, -0.0013023912906646729, -0.0012091994285583496, -0.0011160075664520264, -0.0010228157043457031, -0.0009296238422393799, -0.0008364319801330566, -0.0007432401180267334, -0.0006500482559204102, -0.0005568563938140869, -0.00046366453170776367, -0.00037047266960144043, -0.0002772808074951172, -0.00018408894538879395, -9.08970832824707e-05, 2.294778823852539e-06, 9.548664093017578e-05, 0.00018867850303649902, 0.00028187036514282227, 0.0003750622272491455, 0.00046825408935546875, 0.000561445951461792, 0.0006546378135681152, 0.0007478296756744385, 0.0008410215377807617, 0.000934213399887085, 0.0010274052619934082, 0.0011205971240997314, 0.0012137889862060547, 0.001306980848312378, 0.0014001727104187012, 0.0014933645725250244, 0.0015865564346313477, 0.001679748296737671, 0.0017729401588439941, 0.0018661320209503174, 0.0019593238830566406, 0.002052515745162964, 0.002145707607269287, 0.0022388994693756104, 0.0023320913314819336, 0.002425283193588257, 0.00251847505569458, 0.0026116669178009033, 0.0027048587799072266, 0.00279805064201355, 0.002891242504119873, 0.0029844343662261963, 0.0030776262283325195, 0.0031708180904388428, 0.003264009952545166, 0.0033572018146514893, 0.0034503936767578125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 14.0, 24.0, 28.0, 43.0, 40.0, 57.0, 88.0, 98.0, 134.0, 176.0, 289.0, 549.0, 1040.0, 57291.0, 985205.0, 1641.0, 642.0, 357.0, 241.0, 165.0, 93.0, 58.0, 69.0, 47.0, 35.0, 37.0, 20.0, 17.0, 12.0, 10.0, 10.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.06158447265625, -0.05988311767578125, -0.0581817626953125, -0.05648040771484375, -0.054779052734375, -0.05307769775390625, -0.0513763427734375, -0.04967498779296875, -0.0479736328125, -0.04627227783203125, -0.0445709228515625, -0.04286956787109375, -0.041168212890625, -0.03946685791015625, -0.0377655029296875, -0.03606414794921875, -0.03436279296875, -0.03266143798828125, -0.0309600830078125, -0.02925872802734375, -0.027557373046875, -0.02585601806640625, -0.0241546630859375, -0.02245330810546875, -0.020751953125, -0.01905059814453125, -0.0173492431640625, -0.01564788818359375, -0.013946533203125, -0.01224517822265625, -0.0105438232421875, -0.00884246826171875, -0.00714111328125, -0.00543975830078125, -0.0037384033203125, -0.00203704833984375, -0.000335693359375, 0.00136566162109375, 0.0030670166015625, 0.00476837158203125, 0.0064697265625, 0.00817108154296875, 0.0098724365234375, 0.01157379150390625, 0.013275146484375, 0.01497650146484375, 0.0166778564453125, 0.01837921142578125, 0.02008056640625, 0.02178192138671875, 0.0234832763671875, 0.02518463134765625, 0.026885986328125, 0.02858734130859375, 0.0302886962890625, 0.03199005126953125, 0.03369140625, 0.03539276123046875, 0.0370941162109375, 0.03879547119140625, 0.040496826171875, 0.04219818115234375, 0.0438995361328125, 0.04560089111328125, 0.04730224609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 20.0, 97.0, 324.0, 405.0, 135.0, 25.0, 6.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.007933234795928001, -0.007791867479681969, -0.007650499697774649, -0.007509132381528616, -0.007367765065282583, -0.0072263977490365505, -0.0070850299671292305, -0.006943662650883198, -0.006802295334637165, -0.006660928018391132, -0.006519560236483812, -0.00637819292023778, -0.006236825603991747, -0.006095458287745714, -0.005954090505838394, -0.0058127231895923615, -0.005671355873346329, -0.005529988557100296, -0.005388620775192976, -0.005247253458946943, -0.005105886142700911, -0.004964518826454878, -0.004823151044547558, -0.004681783728301525, -0.004540415946394205, -0.004399048630148172, -0.004257680848240852, -0.00411631353199482, -0.003974946215748787, -0.0038335786666721106, -0.003692211117595434, -0.0035508438013494015, -0.003409476252272725, -0.0032681087031960487, -0.003126741386950016, -0.0029853738378733397, -0.002844006521627307, -0.0027026389725506306, -0.002561271656304598, -0.0024199041072279215, -0.002278536558151245, -0.0021371690090745687, -0.001995801692828536, -0.0018544341437518597, -0.001713066827505827, -0.0015716992784291506, -0.001430331845767796, -0.0012889644131064415, -0.0011475970968604088, -0.0010062296641990542, -0.0008648622315376997, -0.0007234947406686842, -0.0005821273080073297, -0.00044075987534597516, -0.0002993923844769597, -0.00015802495181560516, -1.6657519154250622e-05, 0.00012470992805901915, 0.0002660773752722889, 0.0004074448370374739, 0.0005488122696988285, 0.000690179702360183, 0.0008315471932291985, 0.000972914625890553, 0.0011142820585519075]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 8.0, 6.0, 5.0, 5.0, 3.0, 9.0, 12.0, 15.0, 14.0, 16.0, 20.0, 21.0, 30.0, 29.0, 33.0, 39.0, 42.0, 32.0, 31.0, 32.0, 36.0, 41.0, 41.0, 35.0, 36.0, 45.0, 35.0, 33.0, 33.0, 39.0, 25.0, 27.0, 23.0, 27.0, 16.0, 20.0, 13.0, 9.0, 13.0, 11.0, 4.0, 9.0, 5.0, 8.0, 1.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011650919914245605, -0.001124613918364048, -0.0010841358453035355, -0.001043657772243023, -0.0010031796991825104, -0.0009627016261219978, -0.0009222235530614853, -0.0008817454800009727, -0.0008412674069404602, -0.0008007893338799477, -0.0007603112608194351, -0.0007198331877589226, -0.00067935511469841, -0.0006388770416378975, -0.000598398968577385, -0.0005579208955168724, -0.0005174428224563599, -0.0004769647493958473, -0.0004364866763353348, -0.00039600860327482224, -0.0003555305302143097, -0.00031505245715379715, -0.0002745743840932846, -0.00023409631103277206, -0.00019361823797225952, -0.00015314016491174698, -0.00011266209185123444, -7.21840187907219e-05, -3.170594573020935e-05, 8.772127330303192e-06, 4.9250200390815735e-05, 8.972827345132828e-05, 0.00013020634651184082, 0.00017068441957235336, 0.0002111624926328659, 0.00025164056569337845, 0.000292118638753891, 0.00033259671181440353, 0.0003730747848749161, 0.0004135528579354286, 0.00045403093099594116, 0.0004945090040564537, 0.0005349870771169662, 0.0005754651501774788, 0.0006159432232379913, 0.0006564212962985039, 0.0006968993693590164, 0.000737377442419529, 0.0007778555154800415, 0.000818333588540554, 0.0008588116616010666, 0.0008992897346615791, 0.0009397678077220917, 0.0009802458807826042, 0.0010207239538431168, 0.0010612020269036293, 0.0011016800999641418, 0.0011421581730246544, 0.001182636246085167, 0.0012231143191456795, 0.001263592392206192, 0.0013040704652667046, 0.001344548538327217, 0.0013850266113877296, 0.0014255046844482422]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 6.0, 5.0, 4.0, 8.0, 8.0, 7.0, 15.0, 19.0, 17.0, 18.0, 19.0, 25.0, 26.0, 28.0, 42.0, 35.0, 35.0, 33.0, 40.0, 34.0, 35.0, 43.0, 47.0, 39.0, 50.0, 35.0, 34.0, 35.0, 38.0, 27.0, 28.0, 37.0, 25.0, 23.0, 10.0, 12.0, 9.0, 7.0, 2.0, 8.0, 6.0, 10.0, 4.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.5234375, -9.239501953125, -8.95556640625, -8.671630859375, -8.3876953125, -8.103759765625, -7.81982421875, -7.535888671875, -7.251953125, -6.968017578125, -6.68408203125, -6.400146484375, -6.1162109375, -5.832275390625, -5.54833984375, -5.264404296875, -4.98046875, -4.696533203125, -4.41259765625, -4.128662109375, -3.8447265625, -3.560791015625, -3.27685546875, -2.992919921875, -2.708984375, -2.425048828125, -2.14111328125, -1.857177734375, -1.5732421875, -1.289306640625, -1.00537109375, -0.721435546875, -0.4375, -0.153564453125, 0.13037109375, 0.414306640625, 0.6982421875, 0.982177734375, 1.26611328125, 1.550048828125, 1.833984375, 2.117919921875, 2.40185546875, 2.685791015625, 2.9697265625, 3.253662109375, 3.53759765625, 3.821533203125, 4.10546875, 4.389404296875, 4.67333984375, 4.957275390625, 5.2412109375, 5.525146484375, 5.80908203125, 6.093017578125, 6.376953125, 6.660888671875, 6.94482421875, 7.228759765625, 7.5126953125, 7.796630859375, 8.08056640625, 8.364501953125, 8.6484375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 15.0, 18.0, 17.0, 26.0, 26.0, 43.0, 41.0, 44.0, 86.0, 102.0, 161.0, 174.0, 275.0, 381.0, 629.0, 1155.0, 2155.0, 4255.0, 10749.0, 29942.0, 85989.0, 243182.0, 385457.0, 182089.0, 63355.0, 21966.0, 8156.0, 3555.0, 1691.0, 938.0, 566.0, 316.0, 240.0, 192.0, 130.0, 113.0, 75.0, 53.0, 40.0, 39.0, 30.0, 16.0, 19.0, 11.0, 7.0, 12.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.1640625, -11.776123046875, -11.38818359375, -11.000244140625, -10.6123046875, -10.224365234375, -9.83642578125, -9.448486328125, -9.060546875, -8.672607421875, -8.28466796875, -7.896728515625, -7.5087890625, -7.120849609375, -6.73291015625, -6.344970703125, -5.95703125, -5.569091796875, -5.18115234375, -4.793212890625, -4.4052734375, -4.017333984375, -3.62939453125, -3.241455078125, -2.853515625, -2.465576171875, -2.07763671875, -1.689697265625, -1.3017578125, -0.913818359375, -0.52587890625, -0.137939453125, 0.25, 0.637939453125, 1.02587890625, 1.413818359375, 1.8017578125, 2.189697265625, 2.57763671875, 2.965576171875, 3.353515625, 3.741455078125, 4.12939453125, 4.517333984375, 4.9052734375, 5.293212890625, 5.68115234375, 6.069091796875, 6.45703125, 6.844970703125, 7.23291015625, 7.620849609375, 8.0087890625, 8.396728515625, 8.78466796875, 9.172607421875, 9.560546875, 9.948486328125, 10.33642578125, 10.724365234375, 11.1123046875, 11.500244140625, 11.88818359375, 12.276123046875, 12.6640625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 1.0, 9.0, 7.0, 8.0, 12.0, 15.0, 26.0, 21.0, 28.0, 31.0, 32.0, 37.0, 49.0, 59.0, 58.0, 116.0, 193.0, 315.0, 1315.0, 179.0, 102.0, 82.0, 64.0, 48.0, 36.0, 35.0, 32.0, 23.0, 19.0, 12.0, 17.0, 15.0, 16.0, 9.0, 5.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.1875, -22.388427734375, -21.58935546875, -20.790283203125, -19.9912109375, -19.192138671875, -18.39306640625, -17.593994140625, -16.794921875, -15.995849609375, -15.19677734375, -14.397705078125, -13.5986328125, -12.799560546875, -12.00048828125, -11.201416015625, -10.40234375, -9.603271484375, -8.80419921875, -8.005126953125, -7.2060546875, -6.406982421875, -5.60791015625, -4.808837890625, -4.009765625, -3.210693359375, -2.41162109375, -1.612548828125, -0.8134765625, -0.014404296875, 0.78466796875, 1.583740234375, 2.3828125, 3.181884765625, 3.98095703125, 4.780029296875, 5.5791015625, 6.378173828125, 7.17724609375, 7.976318359375, 8.775390625, 9.574462890625, 10.37353515625, 11.172607421875, 11.9716796875, 12.770751953125, 13.56982421875, 14.368896484375, 15.16796875, 15.967041015625, 16.76611328125, 17.565185546875, 18.3642578125, 19.163330078125, 19.96240234375, 20.761474609375, 21.560546875, 22.359619140625, 23.15869140625, 23.957763671875, 24.7568359375, 25.555908203125, 26.35498046875, 27.154052734375, 27.953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 5.0, 14.0, 11.0, 18.0, 17.0, 37.0, 39.0, 76.0, 80.0, 133.0, 222.0, 290.0, 514.0, 1034.0, 5748.0, 507501.0, 2612138.0, 14714.0, 1380.0, 626.0, 375.0, 252.0, 133.0, 101.0, 56.0, 54.0, 29.0, 30.0, 21.0, 18.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.15625, -46.24072265625, -44.3251953125, -42.40966796875, -40.494140625, -38.57861328125, -36.6630859375, -34.74755859375, -32.83203125, -30.91650390625, -29.0009765625, -27.08544921875, -25.169921875, -23.25439453125, -21.3388671875, -19.42333984375, -17.5078125, -15.59228515625, -13.6767578125, -11.76123046875, -9.845703125, -7.93017578125, -6.0146484375, -4.09912109375, -2.18359375, -0.26806640625, 1.6474609375, 3.56298828125, 5.478515625, 7.39404296875, 9.3095703125, 11.22509765625, 13.140625, 15.05615234375, 16.9716796875, 18.88720703125, 20.802734375, 22.71826171875, 24.6337890625, 26.54931640625, 28.46484375, 30.38037109375, 32.2958984375, 34.21142578125, 36.126953125, 38.04248046875, 39.9580078125, 41.87353515625, 43.7890625, 45.70458984375, 47.6201171875, 49.53564453125, 51.451171875, 53.36669921875, 55.2822265625, 57.19775390625, 59.11328125, 61.02880859375, 62.9443359375, 64.85986328125, 66.775390625, 68.69091796875, 70.6064453125, 72.52197265625, 74.4375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 14.0, 96.0, 318.0, 412.0, 146.0, 23.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.877758026123047, -24.12710952758789, -19.376461029052734, -14.625810623168945, -9.875162124633789, -5.124513626098633, -0.37386322021484375, 4.3767852783203125, 9.127433776855469, 13.878082275390625, 18.62873077392578, 23.37938117980957, 28.130029678344727, 32.88067626953125, 37.63132858276367, 42.38197708129883, 47.132625579833984, 51.88327407836914, 56.6339225769043, 61.38457489013672, 66.13522338867188, 70.88587188720703, 75.63652038574219, 80.38716888427734, 85.1378173828125, 89.88846588134766, 94.63911437988281, 99.38976287841797, 104.14041137695312, 108.89105987548828, 113.64170837402344, 118.39236450195312, 123.14302062988281, 127.89366912841797, 132.64431762695312, 137.3949737548828, 142.14561462402344, 146.89627075195312, 151.64691162109375, 156.39756774902344, 161.14820861816406, 165.89886474609375, 170.64950561523438, 175.40016174316406, 180.1508026123047, 184.90145874023438, 189.652099609375, 194.4027557373047, 199.15341186523438, 203.90406799316406, 208.6547088623047, 213.40536499023438, 218.156005859375, 222.9066619873047, 227.6573028564453, 232.407958984375, 237.15859985351562, 241.9092559814453, 246.65989685058594, 251.41055297851562, 256.16119384765625, 260.9118347167969, 265.6625061035156, 270.41314697265625, 275.1637878417969]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 6.0, 11.0, 19.0, 19.0, 18.0, 18.0, 19.0, 24.0, 34.0, 34.0, 30.0, 26.0, 34.0, 29.0, 29.0, 31.0, 34.0, 38.0, 45.0, 50.0, 31.0, 25.0, 36.0, 22.0, 36.0, 41.0, 29.0, 25.0, 19.0, 18.0, 22.0, 19.0, 16.0, 23.0, 14.0, 5.0, 9.0, 11.0, 5.0, 7.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.03937530517578, -41.484378814697266, -39.92938232421875, -38.374385833740234, -36.81938934326172, -35.2643928527832, -33.70939636230469, -32.15440368652344, -30.59940528869629, -29.044408798217773, -27.489412307739258, -25.934417724609375, -24.37942123413086, -22.824424743652344, -21.269428253173828, -19.714431762695312, -18.159435272216797, -16.60443878173828, -15.049442291259766, -13.494446754455566, -11.93945026397705, -10.384453773498535, -8.829458236694336, -7.27446174621582, -5.719465255737305, -4.164468765258789, -2.6094727516174316, -1.0544767379760742, 0.5005197525024414, 2.055516242980957, 3.6105117797851562, 5.165508270263672, 6.7205047607421875, 8.275501251220703, 9.830497741699219, 11.385493278503418, 12.940489768981934, 14.49548625946045, 16.05048179626465, 17.605478286743164, 19.16047477722168, 20.715471267700195, 22.27046775817871, 23.825462341308594, 25.38045883178711, 26.935455322265625, 28.49045181274414, 30.045448303222656, 31.600444793701172, 33.15544128417969, 34.7104377746582, 36.26543426513672, 37.820430755615234, 39.37542724609375, 40.930419921875, 42.48542022705078, 44.04041290283203, 45.59540939331055, 47.15040588378906, 48.70540237426758, 50.260398864746094, 51.81539535522461, 53.370391845703125, 54.925384521484375, 56.480384826660156]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 10.0, 9.0, 8.0, 17.0, 14.0, 11.0, 15.0, 19.0, 15.0, 28.0, 24.0, 27.0, 36.0, 29.0, 30.0, 30.0, 47.0, 35.0, 39.0, 38.0, 39.0, 44.0, 42.0, 35.0, 42.0, 41.0, 40.0, 33.0, 31.0, 31.0, 25.0, 16.0, 8.0, 15.0, 11.0, 9.0, 10.0, 5.0, 6.0, 5.0, 9.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-9.4453125, -9.166259765625, -8.88720703125, -8.608154296875, -8.3291015625, -8.050048828125, -7.77099609375, -7.491943359375, -7.212890625, -6.933837890625, -6.65478515625, -6.375732421875, -6.0966796875, -5.817626953125, -5.53857421875, -5.259521484375, -4.98046875, -4.701416015625, -4.42236328125, -4.143310546875, -3.8642578125, -3.585205078125, -3.30615234375, -3.027099609375, -2.748046875, -2.468994140625, -2.18994140625, -1.910888671875, -1.6318359375, -1.352783203125, -1.07373046875, -0.794677734375, -0.515625, -0.236572265625, 0.04248046875, 0.321533203125, 0.6005859375, 0.879638671875, 1.15869140625, 1.437744140625, 1.716796875, 1.995849609375, 2.27490234375, 2.553955078125, 2.8330078125, 3.112060546875, 3.39111328125, 3.670166015625, 3.94921875, 4.228271484375, 4.50732421875, 4.786376953125, 5.0654296875, 5.344482421875, 5.62353515625, 5.902587890625, 6.181640625, 6.460693359375, 6.73974609375, 7.018798828125, 7.2978515625, 7.576904296875, 7.85595703125, 8.135009765625, 8.4140625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 9.0, 9.0, 21.0, 26.0, 20.0, 25.0, 41.0, 37.0, 67.0, 77.0, 102.0, 140.0, 209.0, 274.0, 373.0, 551.0, 5431.0, 4016327.0, 167874.0, 991.0, 442.0, 288.0, 219.0, 186.0, 123.0, 87.0, 75.0, 47.0, 43.0, 27.0, 28.0, 18.0, 17.0, 17.0, 15.0, 5.0, 8.0, 4.0, 5.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.6875, -87.9990234375, -85.310546875, -82.6220703125, -79.93359375, -77.2451171875, -74.556640625, -71.8681640625, -69.1796875, -66.4912109375, -63.802734375, -61.1142578125, -58.42578125, -55.7373046875, -53.048828125, -50.3603515625, -47.671875, -44.9833984375, -42.294921875, -39.6064453125, -36.91796875, -34.2294921875, -31.541015625, -28.8525390625, -26.1640625, -23.4755859375, -20.787109375, -18.0986328125, -15.41015625, -12.7216796875, -10.033203125, -7.3447265625, -4.65625, -1.9677734375, 0.720703125, 3.4091796875, 6.09765625, 8.7861328125, 11.474609375, 14.1630859375, 16.8515625, 19.5400390625, 22.228515625, 24.9169921875, 27.60546875, 30.2939453125, 32.982421875, 35.6708984375, 38.359375, 41.0478515625, 43.736328125, 46.4248046875, 49.11328125, 51.8017578125, 54.490234375, 57.1787109375, 59.8671875, 62.5556640625, 65.244140625, 67.9326171875, 70.62109375, 73.3095703125, 75.998046875, 78.6865234375, 81.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 15.0, 8.0, 13.0, 21.0, 19.0, 31.0, 50.0, 54.0, 108.0, 123.0, 197.0, 305.0, 474.0, 602.0, 613.0, 439.0, 321.0, 207.0, 144.0, 99.0, 65.0, 35.0, 39.0, 24.0, 18.0, 16.0, 14.0, 9.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.234375, -19.68798828125, -19.1416015625, -18.59521484375, -18.048828125, -17.50244140625, -16.9560546875, -16.40966796875, -15.86328125, -15.31689453125, -14.7705078125, -14.22412109375, -13.677734375, -13.13134765625, -12.5849609375, -12.03857421875, -11.4921875, -10.94580078125, -10.3994140625, -9.85302734375, -9.306640625, -8.76025390625, -8.2138671875, -7.66748046875, -7.12109375, -6.57470703125, -6.0283203125, -5.48193359375, -4.935546875, -4.38916015625, -3.8427734375, -3.29638671875, -2.75, -2.20361328125, -1.6572265625, -1.11083984375, -0.564453125, -0.01806640625, 0.5283203125, 1.07470703125, 1.62109375, 2.16748046875, 2.7138671875, 3.26025390625, 3.806640625, 4.35302734375, 4.8994140625, 5.44580078125, 5.9921875, 6.53857421875, 7.0849609375, 7.63134765625, 8.177734375, 8.72412109375, 9.2705078125, 9.81689453125, 10.36328125, 10.90966796875, 11.4560546875, 12.00244140625, 12.548828125, 13.09521484375, 13.6416015625, 14.18798828125, 14.734375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 10.0, 13.0, 22.0, 31.0, 36.0, 51.0, 83.0, 147.0, 289.0, 1161.0, 47756.0, 4042788.0, 99493.0, 1630.0, 322.0, 165.0, 82.0, 55.0, 33.0, 31.0, 26.0, 22.0, 11.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.6875, -48.44140625, -46.1953125, -43.94921875, -41.703125, -39.45703125, -37.2109375, -34.96484375, -32.71875, -30.47265625, -28.2265625, -25.98046875, -23.734375, -21.48828125, -19.2421875, -16.99609375, -14.75, -12.50390625, -10.2578125, -8.01171875, -5.765625, -3.51953125, -1.2734375, 0.97265625, 3.21875, 5.46484375, 7.7109375, 9.95703125, 12.203125, 14.44921875, 16.6953125, 18.94140625, 21.1875, 23.43359375, 25.6796875, 27.92578125, 30.171875, 32.41796875, 34.6640625, 36.91015625, 39.15625, 41.40234375, 43.6484375, 45.89453125, 48.140625, 50.38671875, 52.6328125, 54.87890625, 57.125, 59.37109375, 61.6171875, 63.86328125, 66.109375, 68.35546875, 70.6015625, 72.84765625, 75.09375, 77.33984375, 79.5859375, 81.83203125, 84.078125, 86.32421875, 88.5703125, 90.81640625, 93.0625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 28.0, 180.0, 483.0, 259.0, 57.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.067626953125, -209.0161895751953, -201.96475219726562, -194.91331481933594, -187.86187744140625, -180.8104248046875, -173.75900268554688, -166.70755004882812, -159.65611267089844, -152.60467529296875, -145.55323791503906, -138.50180053710938, -131.4503631591797, -124.39891815185547, -117.34748077392578, -110.29603576660156, -103.2446060180664, -96.19316864013672, -89.14173126220703, -82.09028625488281, -75.03884887695312, -67.98741149902344, -60.93597412109375, -53.8845329284668, -46.83309555053711, -39.78165817260742, -32.73021697998047, -25.67877960205078, -18.62734031677246, -11.57590103149414, -4.524463653564453, 2.5269775390625, 9.578414916992188, 16.629854202270508, 23.681293487548828, 30.732730865478516, 37.78417205810547, 44.835609436035156, 51.887046813964844, 58.9384880065918, 65.98992919921875, 73.04136657714844, 80.09280395507812, 87.14424133300781, 94.19568634033203, 101.24712371826172, 108.2985610961914, 115.35000610351562, 122.40143585205078, 129.452880859375, 136.5043182373047, 143.55575561523438, 150.60719299316406, 157.65863037109375, 164.71006774902344, 171.76150512695312, 178.8129425048828, 185.8643798828125, 192.9158172607422, 199.96725463867188, 207.01869201660156, 214.07012939453125, 221.12158203125, 228.1730194091797, 235.22445678710938]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 4.0, 8.0, 5.0, 2.0, 12.0, 16.0, 17.0, 17.0, 16.0, 21.0, 16.0, 23.0, 31.0, 33.0, 37.0, 33.0, 33.0, 40.0, 43.0, 49.0, 29.0, 35.0, 40.0, 46.0, 31.0, 39.0, 37.0, 34.0, 34.0, 32.0, 25.0, 18.0, 20.0, 17.0, 18.0, 14.0, 11.0, 7.0, 10.0, 10.0, 12.0, 6.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.22955322265625, -44.726890563964844, -43.22422409057617, -41.721561431884766, -40.21889877319336, -38.71623229980469, -37.21356964111328, -35.710906982421875, -34.20824432373047, -32.70558166503906, -31.202917098999023, -29.700252532958984, -28.197589874267578, -26.69492530822754, -25.1922607421875, -23.689598083496094, -22.186931610107422, -20.684267044067383, -19.181604385375977, -17.678939819335938, -16.17627716064453, -14.673612594604492, -13.170948028564453, -11.66828441619873, -10.165620803833008, -8.662957191467285, -7.160293102264404, -5.657629013061523, -4.154965400695801, -2.652301788330078, -1.149637222290039, 0.3530263900756836, 1.8556861877441406, 3.3583500385284424, 4.861013889312744, 6.363677978515625, 7.866341590881348, 9.36900520324707, 10.87166976928711, 12.374333381652832, 13.876996994018555, 15.379660606384277, 16.88232421875, 18.38498878479004, 19.887653350830078, 21.390316009521484, 22.892980575561523, 24.395645141601562, 25.89830780029297, 27.400972366333008, 28.903635025024414, 30.406299591064453, 31.90896224975586, 33.41162872314453, 34.91429138183594, 36.416954040527344, 37.91961669921875, 39.422279357910156, 40.92494583129883, 42.427608489990234, 43.93027114868164, 45.43293762207031, 46.93560028076172, 48.438262939453125, 49.9409294128418]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 6.0, 7.0, 8.0, 8.0, 9.0, 13.0, 11.0, 18.0, 9.0, 14.0, 17.0, 20.0, 25.0, 21.0, 37.0, 32.0, 30.0, 29.0, 39.0, 48.0, 41.0, 48.0, 41.0, 39.0, 35.0, 40.0, 34.0, 39.0, 26.0, 30.0, 30.0, 26.0, 28.0, 21.0, 17.0, 13.0, 10.0, 15.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-8.7734375, -8.5087890625, -8.244140625, -7.9794921875, -7.71484375, -7.4501953125, -7.185546875, -6.9208984375, -6.65625, -6.3916015625, -6.126953125, -5.8623046875, -5.59765625, -5.3330078125, -5.068359375, -4.8037109375, -4.5390625, -4.2744140625, -4.009765625, -3.7451171875, -3.48046875, -3.2158203125, -2.951171875, -2.6865234375, -2.421875, -2.1572265625, -1.892578125, -1.6279296875, -1.36328125, -1.0986328125, -0.833984375, -0.5693359375, -0.3046875, -0.0400390625, 0.224609375, 0.4892578125, 0.75390625, 1.0185546875, 1.283203125, 1.5478515625, 1.8125, 2.0771484375, 2.341796875, 2.6064453125, 2.87109375, 3.1357421875, 3.400390625, 3.6650390625, 3.9296875, 4.1943359375, 4.458984375, 4.7236328125, 4.98828125, 5.2529296875, 5.517578125, 5.7822265625, 6.046875, 6.3115234375, 6.576171875, 6.8408203125, 7.10546875, 7.3701171875, 7.634765625, 7.8994140625, 8.1640625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 8.0, 4.0, 10.0, 12.0, 14.0, 15.0, 44.0, 44.0, 74.0, 111.0, 156.0, 260.0, 419.0, 622.0, 948.0, 1555.0, 2466.0, 3776.0, 5955.0, 9553.0, 15205.0, 24512.0, 39350.0, 64575.0, 105843.0, 170705.0, 212473.0, 149359.0, 91654.0, 56316.0, 34463.0, 21649.0, 13455.0, 8419.0, 5319.0, 3344.0, 2121.0, 1317.0, 869.0, 560.0, 340.0, 229.0, 165.0, 104.0, 53.0, 45.0, 23.0, 23.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.76708984375, -0.7433853149414062, -0.7196807861328125, -0.6959762573242188, -0.672271728515625, -0.6485671997070312, -0.6248626708984375, -0.6011581420898438, -0.57745361328125, -0.5537490844726562, -0.5300445556640625, -0.5063400268554688, -0.482635498046875, -0.45893096923828125, -0.4352264404296875, -0.41152191162109375, -0.3878173828125, -0.36411285400390625, -0.3404083251953125, -0.31670379638671875, -0.292999267578125, -0.26929473876953125, -0.2455902099609375, -0.22188568115234375, -0.19818115234375, -0.17447662353515625, -0.1507720947265625, -0.12706756591796875, -0.103363037109375, -0.07965850830078125, -0.0559539794921875, -0.03224945068359375, -0.008544921875, 0.01515960693359375, 0.0388641357421875, 0.06256866455078125, 0.086273193359375, 0.10997772216796875, 0.1336822509765625, 0.15738677978515625, 0.18109130859375, 0.20479583740234375, 0.2285003662109375, 0.25220489501953125, 0.275909423828125, 0.29961395263671875, 0.3233184814453125, 0.34702301025390625, 0.3707275390625, 0.39443206787109375, 0.4181365966796875, 0.44184112548828125, 0.465545654296875, 0.48925018310546875, 0.5129547119140625, 0.5366592407226562, 0.56036376953125, 0.5840682983398438, 0.6077728271484375, 0.6314773559570312, 0.655181884765625, 0.6788864135742188, 0.7025909423828125, 0.7262954711914062, 0.75]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 6.0, 2.0, 7.0, 7.0, 14.0, 8.0, 10.0, 24.0, 13.0, 18.0, 23.0, 33.0, 30.0, 28.0, 30.0, 24.0, 36.0, 37.0, 28.0, 35.0, 35.0, 1072.0, 43.0, 42.0, 51.0, 39.0, 43.0, 28.0, 37.0, 22.0, 30.0, 25.0, 27.0, 25.0, 12.0, 14.0, 12.0, 12.0, 8.0, 3.0, 9.0, 5.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3828125, -5.20819091796875, -5.0335693359375, -4.85894775390625, -4.684326171875, -4.50970458984375, -4.3350830078125, -4.16046142578125, -3.98583984375, -3.81121826171875, -3.6365966796875, -3.46197509765625, -3.287353515625, -3.11273193359375, -2.9381103515625, -2.76348876953125, -2.5888671875, -2.41424560546875, -2.2396240234375, -2.06500244140625, -1.890380859375, -1.71575927734375, -1.5411376953125, -1.36651611328125, -1.19189453125, -1.01727294921875, -0.8426513671875, -0.66802978515625, -0.493408203125, -0.31878662109375, -0.1441650390625, 0.03045654296875, 0.205078125, 0.37969970703125, 0.5543212890625, 0.72894287109375, 0.903564453125, 1.07818603515625, 1.2528076171875, 1.42742919921875, 1.60205078125, 1.77667236328125, 1.9512939453125, 2.12591552734375, 2.300537109375, 2.47515869140625, 2.6497802734375, 2.82440185546875, 2.9990234375, 3.17364501953125, 3.3482666015625, 3.52288818359375, 3.697509765625, 3.87213134765625, 4.0467529296875, 4.22137451171875, 4.39599609375, 4.57061767578125, 4.7452392578125, 4.91986083984375, 5.094482421875, 5.26910400390625, 5.4437255859375, 5.61834716796875, 5.79296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 7.0, 12.0, 19.0, 35.0, 50.0, 58.0, 105.0, 169.0, 274.0, 369.0, 580.0, 903.0, 1431.0, 2306.0, 3363.0, 5320.0, 8153.0, 12096.0, 18964.0, 29562.0, 45161.0, 70594.0, 108848.0, 156427.0, 1225780.0, 139834.0, 93794.0, 60715.0, 39320.0, 25464.0, 16421.0, 10900.0, 6989.0, 4616.0, 2940.0, 1894.0, 1318.0, 797.0, 548.0, 365.0, 215.0, 140.0, 92.0, 67.0, 42.0, 33.0, 20.0, 10.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.6181640625, -0.60015869140625, -0.5821533203125, -0.56414794921875, -0.546142578125, -0.52813720703125, -0.5101318359375, -0.49212646484375, -0.47412109375, -0.45611572265625, -0.4381103515625, -0.42010498046875, -0.402099609375, -0.38409423828125, -0.3660888671875, -0.34808349609375, -0.330078125, -0.31207275390625, -0.2940673828125, -0.27606201171875, -0.258056640625, -0.24005126953125, -0.2220458984375, -0.20404052734375, -0.18603515625, -0.16802978515625, -0.1500244140625, -0.13201904296875, -0.114013671875, -0.09600830078125, -0.0780029296875, -0.05999755859375, -0.0419921875, -0.02398681640625, -0.0059814453125, 0.01202392578125, 0.030029296875, 0.04803466796875, 0.0660400390625, 0.08404541015625, 0.10205078125, 0.12005615234375, 0.1380615234375, 0.15606689453125, 0.174072265625, 0.19207763671875, 0.2100830078125, 0.22808837890625, 0.24609375, 0.26409912109375, 0.2821044921875, 0.30010986328125, 0.318115234375, 0.33612060546875, 0.3541259765625, 0.37213134765625, 0.39013671875, 0.40814208984375, 0.4261474609375, 0.44415283203125, 0.462158203125, 0.48016357421875, 0.4981689453125, 0.51617431640625, 0.5341796875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 12.0, 20.0, 14.0, 22.0, 25.0, 15.0, 24.0, 34.0, 44.0, 49.0, 68.0, 64.0, 61.0, 61.0, 74.0, 65.0, 67.0, 51.0, 36.0, 35.0, 34.0, 32.0, 20.0, 11.0, 14.0, 10.0, 6.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0025310516357421875, -0.002453625202178955, -0.0023761987686157227, -0.0022987723350524902, -0.002221345901489258, -0.0021439194679260254, -0.002066493034362793, -0.0019890666007995605, -0.0019116401672363281, -0.0018342137336730957, -0.0017567873001098633, -0.0016793608665466309, -0.0016019344329833984, -0.001524507999420166, -0.0014470815658569336, -0.0013696551322937012, -0.0012922286987304688, -0.0012148022651672363, -0.001137375831604004, -0.0010599493980407715, -0.000982522964477539, -0.0009050965309143066, -0.0008276700973510742, -0.0007502436637878418, -0.0006728172302246094, -0.000595390796661377, -0.0005179643630981445, -0.0004405379295349121, -0.0003631114959716797, -0.00028568506240844727, -0.00020825862884521484, -0.00013083219528198242, -5.340576171875e-05, 2.4020671844482422e-05, 0.00010144710540771484, 0.00017887353897094727, 0.0002562999725341797, 0.0003337264060974121, 0.00041115283966064453, 0.000488579273223877, 0.0005660057067871094, 0.0006434321403503418, 0.0007208585739135742, 0.0007982850074768066, 0.0008757114410400391, 0.0009531378746032715, 0.001030564308166504, 0.0011079907417297363, 0.0011854171752929688, 0.0012628436088562012, 0.0013402700424194336, 0.001417696475982666, 0.0014951229095458984, 0.0015725493431091309, 0.0016499757766723633, 0.0017274022102355957, 0.0018048286437988281, 0.0018822550773620605, 0.001959681510925293, 0.0020371079444885254, 0.002114534378051758, 0.0021919608116149902, 0.0022693872451782227, 0.002346813678741455, 0.0024242401123046875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 10.0, 13.0, 15.0, 14.0, 25.0, 38.0, 40.0, 70.0, 82.0, 121.0, 173.0, 276.0, 565.0, 1134.0, 88656.0, 953666.0, 1864.0, 652.0, 386.0, 208.0, 132.0, 92.0, 58.0, 52.0, 46.0, 41.0, 38.0, 29.0, 13.0, 4.0, 2.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.046356201171875, -0.04486894607543945, -0.043381690979003906, -0.04189443588256836, -0.04040718078613281, -0.038919925689697266, -0.03743267059326172, -0.03594541549682617, -0.034458160400390625, -0.03297090530395508, -0.03148365020751953, -0.029996395111083984, -0.028509140014648438, -0.02702188491821289, -0.025534629821777344, -0.024047374725341797, -0.02256011962890625, -0.021072864532470703, -0.019585609436035156, -0.01809835433959961, -0.016611099243164062, -0.015123844146728516, -0.013636589050292969, -0.012149333953857422, -0.010662078857421875, -0.009174823760986328, -0.007687568664550781, -0.006200313568115234, -0.0047130584716796875, -0.0032258033752441406, -0.0017385482788085938, -0.0002512931823730469, 0.0012359619140625, 0.002723217010498047, 0.004210472106933594, 0.005697727203369141, 0.0071849822998046875, 0.008672237396240234, 0.010159492492675781, 0.011646747589111328, 0.013134002685546875, 0.014621257781982422, 0.01610851287841797, 0.017595767974853516, 0.019083023071289062, 0.02057027816772461, 0.022057533264160156, 0.023544788360595703, 0.02503204345703125, 0.026519298553466797, 0.028006553649902344, 0.02949380874633789, 0.030981063842773438, 0.032468318939208984, 0.03395557403564453, 0.03544282913208008, 0.036930084228515625, 0.03841733932495117, 0.03990459442138672, 0.041391849517822266, 0.04287910461425781, 0.04436635971069336, 0.045853614807128906, 0.04734086990356445, 0.048828125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 27.0, 71.0, 151.0, 275.0, 258.0, 139.0, 61.0, 16.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00186209287494421, -0.0017769852420315146, -0.001691877725534141, -0.0016067700926214457, -0.001521662576124072, -0.0014365549432113767, -0.0013514473102986813, -0.0012663397938013077, -0.0011812321608886123, -0.0010961245279759169, -0.0010110170114785433, -0.0009259093785658479, -0.0008408018038608134, -0.0007556942291557789, -0.0006705865962430835, -0.000585479021538049, -0.0005003714468330145, -0.00041526387212798, -0.00033015626831911504, -0.0002450486645102501, -0.0001599410898052156, -7.48335151001811e-05, 1.0274117812514305e-05, 9.53816925175488e-05, 0.0001804892672225833, 0.0002655968419276178, 0.00035070444573648274, 0.0004358120495453477, 0.0005209196242503822, 0.0006060271989554167, 0.0006911348318681121, 0.0007762424065731466, 0.0008613502141088247, 0.0009464577888138592, 0.0010315653635188937, 0.0011166729964315891, 0.0012017805129289627, 0.0012868881458416581, 0.0013719957787543535, 0.001457103295251727, 0.0015422109281644225, 0.001627318561077118, 0.0017124260775744915, 0.001797533710487187, 0.0018826413433998823, 0.001967748859897256, 0.002052856609225273, 0.0021379641257226467, 0.0022230716422200203, 0.002308179158717394, 0.002393286908045411, 0.0024783944245427847, 0.0025635019410401583, 0.0026486096903681755, 0.002733717206865549, 0.0028188247233629227, 0.0029039322398602962, 0.00298903975635767, 0.003074147505685687, 0.0031592550221830606, 0.0032443625386804342, 0.0033294702880084515, 0.003414577804505825, 0.0034996853210031986, 0.003584793070331216]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 8.0, 8.0, 3.0, 9.0, 6.0, 8.0, 14.0, 8.0, 23.0, 14.0, 18.0, 28.0, 33.0, 27.0, 37.0, 44.0, 36.0, 42.0, 37.0, 51.0, 45.0, 36.0, 35.0, 42.0, 41.0, 51.0, 40.0, 31.0, 43.0, 22.0, 28.0, 22.0, 19.0, 17.0, 20.0, 12.0, 9.0, 9.0, 9.0, 10.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001218259334564209, -0.0011798962950706482, -0.0011415332555770874, -0.0011031702160835266, -0.0010648071765899658, -0.001026444137096405, -0.0009880810976028442, -0.0009497180581092834, -0.0009113550186157227, -0.0008729919791221619, -0.0008346289396286011, -0.0007962659001350403, -0.0007579028606414795, -0.0007195398211479187, -0.0006811767816543579, -0.0006428137421607971, -0.0006044507026672363, -0.0005660876631736755, -0.0005277246236801147, -0.000489361584186554, -0.00045099854469299316, -0.0004126355051994324, -0.0003742724657058716, -0.0003359094262123108, -0.00029754638671875, -0.0002591833472251892, -0.00022082030773162842, -0.00018245726823806763, -0.00014409422874450684, -0.00010573118925094604, -6.736814975738525e-05, -2.9005110263824463e-05, 9.357929229736328e-06, 4.772096872329712e-05, 8.608400821685791e-05, 0.0001244470477104187, 0.0001628100872039795, 0.00020117312669754028, 0.00023953616619110107, 0.00027789920568466187, 0.00031626224517822266, 0.00035462528467178345, 0.00039298832416534424, 0.00043135136365890503, 0.0004697144031524658, 0.0005080774426460266, 0.0005464404821395874, 0.0005848035216331482, 0.000623166561126709, 0.0006615296006202698, 0.0006998926401138306, 0.0007382556796073914, 0.0007766187191009521, 0.0008149817585945129, 0.0008533447980880737, 0.0008917078375816345, 0.0009300708770751953, 0.0009684339165687561, 0.001006796956062317, 0.0010451599955558777, 0.0010835230350494385, 0.0011218860745429993, 0.00116024911403656, 0.0011986121535301208, 0.0012369751930236816]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 6.0, 7.0, 8.0, 8.0, 9.0, 13.0, 11.0, 18.0, 9.0, 14.0, 17.0, 20.0, 26.0, 20.0, 37.0, 32.0, 30.0, 29.0, 39.0, 48.0, 41.0, 48.0, 41.0, 39.0, 35.0, 40.0, 34.0, 39.0, 26.0, 30.0, 30.0, 26.0, 29.0, 20.0, 17.0, 13.0, 10.0, 15.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-8.7734375, -8.5087890625, -8.244140625, -7.9794921875, -7.71484375, -7.4501953125, -7.185546875, -6.9208984375, -6.65625, -6.3916015625, -6.126953125, -5.8623046875, -5.59765625, -5.3330078125, -5.068359375, -4.8037109375, -4.5390625, -4.2744140625, -4.009765625, -3.7451171875, -3.48046875, -3.2158203125, -2.951171875, -2.6865234375, -2.421875, -2.1572265625, -1.892578125, -1.6279296875, -1.36328125, -1.0986328125, -0.833984375, -0.5693359375, -0.3046875, -0.0400390625, 0.224609375, 0.4892578125, 0.75390625, 1.0185546875, 1.283203125, 1.5478515625, 1.8125, 2.0771484375, 2.341796875, 2.6064453125, 2.87109375, 3.1357421875, 3.400390625, 3.6650390625, 3.9296875, 4.1943359375, 4.458984375, 4.7236328125, 4.98828125, 5.2529296875, 5.517578125, 5.7822265625, 6.046875, 6.3115234375, 6.576171875, 6.8408203125, 7.10546875, 7.3701171875, 7.634765625, 7.8994140625, 8.1640625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 12.0, 21.0, 8.0, 13.0, 24.0, 27.0, 36.0, 52.0, 67.0, 104.0, 101.0, 130.0, 162.0, 223.0, 301.0, 353.0, 438.0, 606.0, 833.0, 1188.0, 1819.0, 3931.0, 13343.0, 61184.0, 267144.0, 484489.0, 159775.0, 35424.0, 8145.0, 2838.0, 1573.0, 998.0, 710.0, 513.0, 411.0, 345.0, 285.0, 201.0, 150.0, 133.0, 106.0, 63.0, 51.0, 42.0, 44.0, 28.0, 15.0, 21.0, 14.0, 13.0, 12.0, 11.0, 8.0, 3.0, 4.0, 3.0], "bins": [-17.359375, -16.83837890625, -16.3173828125, -15.79638671875, -15.275390625, -14.75439453125, -14.2333984375, -13.71240234375, -13.19140625, -12.67041015625, -12.1494140625, -11.62841796875, -11.107421875, -10.58642578125, -10.0654296875, -9.54443359375, -9.0234375, -8.50244140625, -7.9814453125, -7.46044921875, -6.939453125, -6.41845703125, -5.8974609375, -5.37646484375, -4.85546875, -4.33447265625, -3.8134765625, -3.29248046875, -2.771484375, -2.25048828125, -1.7294921875, -1.20849609375, -0.6875, -0.16650390625, 0.3544921875, 0.87548828125, 1.396484375, 1.91748046875, 2.4384765625, 2.95947265625, 3.48046875, 4.00146484375, 4.5224609375, 5.04345703125, 5.564453125, 6.08544921875, 6.6064453125, 7.12744140625, 7.6484375, 8.16943359375, 8.6904296875, 9.21142578125, 9.732421875, 10.25341796875, 10.7744140625, 11.29541015625, 11.81640625, 12.33740234375, 12.8583984375, 13.37939453125, 13.900390625, 14.42138671875, 14.9423828125, 15.46337890625, 15.984375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 5.0, 7.0, 9.0, 11.0, 12.0, 10.0, 12.0, 17.0, 25.0, 21.0, 33.0, 35.0, 38.0, 45.0, 59.0, 84.0, 105.0, 200.0, 1403.0, 295.0, 144.0, 86.0, 50.0, 36.0, 41.0, 37.0, 35.0, 30.0, 18.0, 22.0, 22.0, 20.0, 15.0, 10.0, 12.0, 10.0, 7.0, 10.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0], "bins": [-27.84375, -27.125244140625, -26.40673828125, -25.688232421875, -24.9697265625, -24.251220703125, -23.53271484375, -22.814208984375, -22.095703125, -21.377197265625, -20.65869140625, -19.940185546875, -19.2216796875, -18.503173828125, -17.78466796875, -17.066162109375, -16.34765625, -15.629150390625, -14.91064453125, -14.192138671875, -13.4736328125, -12.755126953125, -12.03662109375, -11.318115234375, -10.599609375, -9.881103515625, -9.16259765625, -8.444091796875, -7.7255859375, -7.007080078125, -6.28857421875, -5.570068359375, -4.8515625, -4.133056640625, -3.41455078125, -2.696044921875, -1.9775390625, -1.259033203125, -0.54052734375, 0.177978515625, 0.896484375, 1.614990234375, 2.33349609375, 3.052001953125, 3.7705078125, 4.489013671875, 5.20751953125, 5.926025390625, 6.64453125, 7.363037109375, 8.08154296875, 8.800048828125, 9.5185546875, 10.237060546875, 10.95556640625, 11.674072265625, 12.392578125, 13.111083984375, 13.82958984375, 14.548095703125, 15.2666015625, 15.985107421875, 16.70361328125, 17.422119140625, 18.140625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 7.0, 10.0, 9.0, 11.0, 12.0, 22.0, 14.0, 29.0, 28.0, 37.0, 58.0, 89.0, 118.0, 158.0, 198.0, 293.0, 597.0, 1167.0, 6187.0, 3126867.0, 6800.0, 1299.0, 545.0, 323.0, 195.0, 157.0, 126.0, 72.0, 63.0, 46.0, 36.0, 28.0, 13.0, 19.0, 9.0, 7.0, 8.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-111.25, -107.828125, -104.40625, -100.984375, -97.5625, -94.140625, -90.71875, -87.296875, -83.875, -80.453125, -77.03125, -73.609375, -70.1875, -66.765625, -63.34375, -59.921875, -56.5, -53.078125, -49.65625, -46.234375, -42.8125, -39.390625, -35.96875, -32.546875, -29.125, -25.703125, -22.28125, -18.859375, -15.4375, -12.015625, -8.59375, -5.171875, -1.75, 1.671875, 5.09375, 8.515625, 11.9375, 15.359375, 18.78125, 22.203125, 25.625, 29.046875, 32.46875, 35.890625, 39.3125, 42.734375, 46.15625, 49.578125, 53.0, 56.421875, 59.84375, 63.265625, 66.6875, 70.109375, 73.53125, 76.953125, 80.375, 83.796875, 87.21875, 90.640625, 94.0625, 97.484375, 100.90625, 104.328125, 107.75]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 11.0, 51.0, 139.0, 250.0, 271.0, 186.0, 78.0, 17.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.3551483154297, -143.85218811035156, -140.3492431640625, -136.84628295898438, -133.3433380126953, -129.8403778076172, -126.33743286132812, -122.83447265625, -119.33152770996094, -115.82857513427734, -112.32562255859375, -108.82266998291016, -105.31971740722656, -101.81676483154297, -98.31381225585938, -94.81085205078125, -91.30789947509766, -87.80494689941406, -84.30199432373047, -80.79904174804688, -77.29608917236328, -73.79313659667969, -70.29017639160156, -66.7872314453125, -63.28427505493164, -59.78132247924805, -56.27836990356445, -52.775413513183594, -49.2724609375, -45.769508361816406, -42.26655578613281, -38.76360321044922, -35.260650634765625, -31.75769805908203, -28.254745483398438, -24.75179100036621, -21.248838424682617, -17.745885848999023, -14.242931365966797, -10.739978790283203, -7.237026214599609, -3.7340731620788574, -0.23112010955810547, 3.2718334197998047, 6.774785995483398, 10.277738571166992, 13.780693054199219, 17.283645629882812, 20.786598205566406, 24.28955078125, 27.792503356933594, 31.29545783996582, 34.79840850830078, 38.301361083984375, 41.804317474365234, 45.30727005004883, 48.81022262573242, 52.313175201416016, 55.81612777709961, 59.31908416748047, 62.82203674316406, 66.32498931884766, 69.82794189453125, 73.33089447021484, 76.83384704589844]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 9.0, 10.0, 14.0, 18.0, 19.0, 24.0, 14.0, 18.0, 34.0, 29.0, 41.0, 37.0, 37.0, 47.0, 48.0, 49.0, 47.0, 50.0, 39.0, 39.0, 55.0, 42.0, 38.0, 15.0, 35.0, 28.0, 25.0, 17.0, 22.0, 22.0, 9.0, 5.0, 8.0, 10.0, 9.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.86651611328125, -55.76604080200195, -53.665565490722656, -51.56509017944336, -49.46461486816406, -47.36414337158203, -45.263668060302734, -43.16319274902344, -41.06271743774414, -38.962242126464844, -36.86176681518555, -34.76129150390625, -32.66082000732422, -30.56034278869629, -28.459869384765625, -26.359394073486328, -24.25891876220703, -22.158443450927734, -20.057968139648438, -17.957494735717773, -15.857019424438477, -13.75654411315918, -11.6560697555542, -9.555595397949219, -7.455120086669922, -5.354645252227783, -3.2541704177856445, -1.1536955833435059, 0.9467792510986328, 3.0472545623779297, 5.14772891998291, 7.248203277587891, 9.348678588867188, 11.449153900146484, 13.549628257751465, 15.650102615356445, 17.750577926635742, 19.85105323791504, 21.951526641845703, 24.052001953125, 26.152477264404297, 28.252952575683594, 30.35342788696289, 32.45390319824219, 34.55437469482422, 36.65485382080078, 38.75532531738281, 40.85580062866211, 42.956275939941406, 45.0567512512207, 47.1572265625, 49.2577018737793, 51.358177185058594, 53.458648681640625, 55.55912399291992, 57.65959930419922, 59.760074615478516, 61.86054992675781, 63.96102523803711, 66.0615005493164, 68.16197204589844, 70.262451171875, 72.36292266845703, 74.46339416503906, 76.56387329101562]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 3.0, 7.0, 5.0, 6.0, 8.0, 6.0, 9.0, 10.0, 6.0, 9.0, 10.0, 12.0, 18.0, 13.0, 27.0, 27.0, 32.0, 28.0, 38.0, 30.0, 38.0, 43.0, 53.0, 36.0, 37.0, 41.0, 40.0, 37.0, 36.0, 30.0, 36.0, 25.0, 28.0, 28.0, 29.0, 28.0, 17.0, 18.0, 13.0, 11.0, 23.0, 10.0, 7.0, 5.0, 6.0, 2.0, 5.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.8671875, -8.6043701171875, -8.341552734375, -8.0787353515625, -7.81591796875, -7.5531005859375, -7.290283203125, -7.0274658203125, -6.7646484375, -6.5018310546875, -6.239013671875, -5.9761962890625, -5.71337890625, -5.4505615234375, -5.187744140625, -4.9249267578125, -4.662109375, -4.3992919921875, -4.136474609375, -3.8736572265625, -3.61083984375, -3.3480224609375, -3.085205078125, -2.8223876953125, -2.5595703125, -2.2967529296875, -2.033935546875, -1.7711181640625, -1.50830078125, -1.2454833984375, -0.982666015625, -0.7198486328125, -0.45703125, -0.1942138671875, 0.068603515625, 0.3314208984375, 0.59423828125, 0.8570556640625, 1.119873046875, 1.3826904296875, 1.6455078125, 1.9083251953125, 2.171142578125, 2.4339599609375, 2.69677734375, 2.9595947265625, 3.222412109375, 3.4852294921875, 3.748046875, 4.0108642578125, 4.273681640625, 4.5364990234375, 4.79931640625, 5.0621337890625, 5.324951171875, 5.5877685546875, 5.8505859375, 6.1134033203125, 6.376220703125, 6.6390380859375, 6.90185546875, 7.1646728515625, 7.427490234375, 7.6903076171875, 7.953125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 12.0, 21.0, 38.0, 64.0, 112.0, 225.0, 421.0, 982.0, 2540.0, 9752.0, 78476.0, 1185451.0, 2583370.0, 302907.0, 22939.0, 4408.0, 1363.0, 595.0, 272.0, 151.0, 71.0, 36.0, 23.0, 17.0, 3.0, 8.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.235595703125, -18.50244140625, -17.769287109375, -17.0361328125, -16.302978515625, -15.56982421875, -14.836669921875, -14.103515625, -13.370361328125, -12.63720703125, -11.904052734375, -11.1708984375, -10.437744140625, -9.70458984375, -8.971435546875, -8.23828125, -7.505126953125, -6.77197265625, -6.038818359375, -5.3056640625, -4.572509765625, -3.83935546875, -3.106201171875, -2.373046875, -1.639892578125, -0.90673828125, -0.173583984375, 0.5595703125, 1.292724609375, 2.02587890625, 2.759033203125, 3.4921875, 4.225341796875, 4.95849609375, 5.691650390625, 6.4248046875, 7.157958984375, 7.89111328125, 8.624267578125, 9.357421875, 10.090576171875, 10.82373046875, 11.556884765625, 12.2900390625, 13.023193359375, 13.75634765625, 14.489501953125, 15.22265625, 15.955810546875, 16.68896484375, 17.422119140625, 18.1552734375, 18.888427734375, 19.62158203125, 20.354736328125, 21.087890625, 21.821044921875, 22.55419921875, 23.287353515625, 24.0205078125, 24.753662109375, 25.48681640625, 26.219970703125, 26.953125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 2.0, 7.0, 11.0, 16.0, 22.0, 29.0, 40.0, 50.0, 72.0, 92.0, 105.0, 138.0, 187.0, 284.0, 331.0, 485.0, 487.0, 411.0, 338.0, 217.0, 193.0, 141.0, 109.0, 71.0, 65.0, 44.0, 28.0, 23.0, 16.0, 19.0, 7.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.3125, -15.80908203125, -15.3056640625, -14.80224609375, -14.298828125, -13.79541015625, -13.2919921875, -12.78857421875, -12.28515625, -11.78173828125, -11.2783203125, -10.77490234375, -10.271484375, -9.76806640625, -9.2646484375, -8.76123046875, -8.2578125, -7.75439453125, -7.2509765625, -6.74755859375, -6.244140625, -5.74072265625, -5.2373046875, -4.73388671875, -4.23046875, -3.72705078125, -3.2236328125, -2.72021484375, -2.216796875, -1.71337890625, -1.2099609375, -0.70654296875, -0.203125, 0.30029296875, 0.8037109375, 1.30712890625, 1.810546875, 2.31396484375, 2.8173828125, 3.32080078125, 3.82421875, 4.32763671875, 4.8310546875, 5.33447265625, 5.837890625, 6.34130859375, 6.8447265625, 7.34814453125, 7.8515625, 8.35498046875, 8.8583984375, 9.36181640625, 9.865234375, 10.36865234375, 10.8720703125, 11.37548828125, 11.87890625, 12.38232421875, 12.8857421875, 13.38916015625, 13.892578125, 14.39599609375, 14.8994140625, 15.40283203125, 15.90625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 20.0, 21.0, 29.0, 32.0, 60.0, 78.0, 131.0, 176.0, 257.0, 405.0, 653.0, 1194.0, 2283.0, 6404.0, 41260.0, 509163.0, 3123225.0, 459833.0, 37578.0, 6117.0, 2252.0, 1112.0, 729.0, 419.0, 276.0, 140.0, 134.0, 81.0, 54.0, 43.0, 23.0, 22.0, 12.0, 13.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.328125, -24.54833984375, -23.7685546875, -22.98876953125, -22.208984375, -21.42919921875, -20.6494140625, -19.86962890625, -19.08984375, -18.31005859375, -17.5302734375, -16.75048828125, -15.970703125, -15.19091796875, -14.4111328125, -13.63134765625, -12.8515625, -12.07177734375, -11.2919921875, -10.51220703125, -9.732421875, -8.95263671875, -8.1728515625, -7.39306640625, -6.61328125, -5.83349609375, -5.0537109375, -4.27392578125, -3.494140625, -2.71435546875, -1.9345703125, -1.15478515625, -0.375, 0.40478515625, 1.1845703125, 1.96435546875, 2.744140625, 3.52392578125, 4.3037109375, 5.08349609375, 5.86328125, 6.64306640625, 7.4228515625, 8.20263671875, 8.982421875, 9.76220703125, 10.5419921875, 11.32177734375, 12.1015625, 12.88134765625, 13.6611328125, 14.44091796875, 15.220703125, 16.00048828125, 16.7802734375, 17.56005859375, 18.33984375, 19.11962890625, 19.8994140625, 20.67919921875, 21.458984375, 22.23876953125, 23.0185546875, 23.79833984375, 24.578125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 58.0, 195.0, 344.0, 268.0, 111.0, 25.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.53214263916016, -83.48588562011719, -77.43962097167969, -71.39336395263672, -65.34710693359375, -59.300846099853516, -53.25458526611328, -47.20832824707031, -41.16206741333008, -35.115806579589844, -29.069549560546875, -23.02328872680664, -16.97702980041504, -10.930770874023438, -4.884510040283203, 1.1617469787597656, 7.2080078125, 13.254266738891602, 19.300525665283203, 25.346786499023438, 31.39304542541504, 37.43930435180664, 43.485565185546875, 49.531822204589844, 55.57808303833008, 61.62434387207031, 67.67060089111328, 73.71685791015625, 79.76312255859375, 85.80937957763672, 91.85563659667969, 97.90190124511719, 103.94816589355469, 109.99442291259766, 116.04068756103516, 122.08694458007812, 128.13320922851562, 134.17945861816406, 140.22572326660156, 146.27197265625, 152.3182373046875, 158.364501953125, 164.41075134277344, 170.45701599121094, 176.50328063964844, 182.54953002929688, 188.59579467773438, 194.64205932617188, 200.68832397460938, 206.73458862304688, 212.7808380126953, 218.8271026611328, 224.8733673095703, 230.91961669921875, 236.96588134765625, 243.01214599609375, 249.0583953857422, 255.1046600341797, 261.1509094238281, 267.1971740722656, 273.2434387207031, 279.2897033691406, 285.3359375, 291.3822021484375, 297.428466796875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 12.0, 7.0, 10.0, 11.0, 16.0, 12.0, 15.0, 25.0, 27.0, 20.0, 16.0, 28.0, 29.0, 39.0, 25.0, 40.0, 49.0, 49.0, 40.0, 38.0, 52.0, 38.0, 44.0, 30.0, 37.0, 35.0, 31.0, 30.0, 24.0, 25.0, 21.0, 17.0, 11.0, 17.0, 19.0, 14.0, 5.0, 5.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.56891632080078, -59.69052505493164, -57.8121337890625, -55.93374252319336, -54.05535125732422, -52.17695999145508, -50.29856872558594, -48.42017364501953, -46.541786193847656, -44.663394927978516, -42.785003662109375, -40.906612396240234, -39.028221130371094, -37.14982986450195, -35.27143859863281, -33.393043518066406, -31.514652252197266, -29.636260986328125, -27.757869720458984, -25.879478454589844, -24.001087188720703, -22.122695922851562, -20.24430274963379, -18.36591148376465, -16.487520217895508, -14.609128952026367, -12.730737686157227, -10.85234546661377, -8.973954200744629, -7.095562934875488, -5.217170715332031, -3.3387794494628906, -1.46038818359375, 0.4180033206939697, 2.2963948249816895, 4.174786567687988, 6.053177833557129, 7.9315690994262695, 9.809961318969727, 11.688352584838867, 13.566743850708008, 15.445135116577148, 17.32352638244629, 19.201919555664062, 21.080310821533203, 22.958702087402344, 24.837093353271484, 26.715484619140625, 28.593875885009766, 30.472267150878906, 32.35065841674805, 34.22904968261719, 36.10744094848633, 37.98583221435547, 39.864227294921875, 41.74261474609375, 43.621009826660156, 45.4994010925293, 47.37779235839844, 49.25618362426758, 51.13457489013672, 53.01296615600586, 54.891357421875, 56.769752502441406, 58.64813995361328]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 4.0, 8.0, 11.0, 13.0, 12.0, 19.0, 11.0, 14.0, 19.0, 21.0, 28.0, 27.0, 30.0, 30.0, 36.0, 42.0, 45.0, 34.0, 31.0, 31.0, 44.0, 37.0, 34.0, 36.0, 30.0, 41.0, 25.0, 34.0, 31.0, 27.0, 23.0, 25.0, 25.0, 25.0, 20.0, 10.0, 7.0, 7.0, 6.0, 8.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.18359375, -5.98553466796875, -5.7874755859375, -5.58941650390625, -5.391357421875, -5.19329833984375, -4.9952392578125, -4.79718017578125, -4.59912109375, -4.40106201171875, -4.2030029296875, -4.00494384765625, -3.806884765625, -3.60882568359375, -3.4107666015625, -3.21270751953125, -3.0146484375, -2.81658935546875, -2.6185302734375, -2.42047119140625, -2.222412109375, -2.02435302734375, -1.8262939453125, -1.62823486328125, -1.43017578125, -1.23211669921875, -1.0340576171875, -0.83599853515625, -0.637939453125, -0.43988037109375, -0.2418212890625, -0.04376220703125, 0.154296875, 0.35235595703125, 0.5504150390625, 0.74847412109375, 0.946533203125, 1.14459228515625, 1.3426513671875, 1.54071044921875, 1.73876953125, 1.93682861328125, 2.1348876953125, 2.33294677734375, 2.531005859375, 2.72906494140625, 2.9271240234375, 3.12518310546875, 3.3232421875, 3.52130126953125, 3.7193603515625, 3.91741943359375, 4.115478515625, 4.31353759765625, 4.5115966796875, 4.70965576171875, 4.90771484375, 5.10577392578125, 5.3038330078125, 5.50189208984375, 5.699951171875, 5.89801025390625, 6.0960693359375, 6.29412841796875, 6.4921875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 8.0, 10.0, 13.0, 29.0, 37.0, 55.0, 80.0, 109.0, 179.0, 260.0, 380.0, 560.0, 840.0, 1293.0, 1916.0, 2795.0, 4474.0, 6692.0, 10641.0, 16623.0, 26038.0, 40787.0, 64357.0, 100521.0, 156352.0, 196660.0, 149996.0, 96402.0, 61561.0, 39152.0, 24912.0, 15766.0, 9932.0, 6509.0, 4316.0, 2786.0, 1839.0, 1248.0, 771.0, 544.0, 356.0, 250.0, 171.0, 120.0, 75.0, 52.0, 31.0, 19.0, 18.0, 9.0, 7.0, 4.0, 2.0, 4.0, 3.0], "bins": [-0.56298828125, -0.5466461181640625, -0.530303955078125, -0.5139617919921875, -0.49761962890625, -0.4812774658203125, -0.464935302734375, -0.4485931396484375, -0.4322509765625, -0.4159088134765625, -0.399566650390625, -0.3832244873046875, -0.36688232421875, -0.3505401611328125, -0.334197998046875, -0.3178558349609375, -0.301513671875, -0.2851715087890625, -0.268829345703125, -0.2524871826171875, -0.23614501953125, -0.2198028564453125, -0.203460693359375, -0.1871185302734375, -0.1707763671875, -0.1544342041015625, -0.138092041015625, -0.1217498779296875, -0.10540771484375, -0.0890655517578125, -0.072723388671875, -0.0563812255859375, -0.0400390625, -0.0236968994140625, -0.007354736328125, 0.0089874267578125, 0.02532958984375, 0.0416717529296875, 0.058013916015625, 0.0743560791015625, 0.0906982421875, 0.1070404052734375, 0.123382568359375, 0.1397247314453125, 0.15606689453125, 0.1724090576171875, 0.188751220703125, 0.2050933837890625, 0.221435546875, 0.2377777099609375, 0.254119873046875, 0.2704620361328125, 0.28680419921875, 0.3031463623046875, 0.319488525390625, 0.3358306884765625, 0.3521728515625, 0.3685150146484375, 0.384857177734375, 0.4011993408203125, 0.41754150390625, 0.4338836669921875, 0.450225830078125, 0.4665679931640625, 0.48291015625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 11.0, 7.0, 5.0, 12.0, 24.0, 19.0, 24.0, 28.0, 26.0, 24.0, 32.0, 28.0, 35.0, 47.0, 35.0, 37.0, 61.0, 1074.0, 41.0, 45.0, 39.0, 41.0, 30.0, 37.0, 31.0, 37.0, 36.0, 26.0, 8.0, 13.0, 22.0, 11.0, 16.0, 5.0, 10.0, 14.0, 4.0, 6.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.25, -4.11053466796875, -3.9710693359375, -3.83160400390625, -3.692138671875, -3.55267333984375, -3.4132080078125, -3.27374267578125, -3.13427734375, -2.99481201171875, -2.8553466796875, -2.71588134765625, -2.576416015625, -2.43695068359375, -2.2974853515625, -2.15802001953125, -2.0185546875, -1.87908935546875, -1.7396240234375, -1.60015869140625, -1.460693359375, -1.32122802734375, -1.1817626953125, -1.04229736328125, -0.90283203125, -0.76336669921875, -0.6239013671875, -0.48443603515625, -0.344970703125, -0.20550537109375, -0.0660400390625, 0.07342529296875, 0.212890625, 0.35235595703125, 0.4918212890625, 0.63128662109375, 0.770751953125, 0.91021728515625, 1.0496826171875, 1.18914794921875, 1.32861328125, 1.46807861328125, 1.6075439453125, 1.74700927734375, 1.886474609375, 2.02593994140625, 2.1654052734375, 2.30487060546875, 2.4443359375, 2.58380126953125, 2.7232666015625, 2.86273193359375, 3.002197265625, 3.14166259765625, 3.2811279296875, 3.42059326171875, 3.56005859375, 3.69952392578125, 3.8389892578125, 3.97845458984375, 4.117919921875, 4.25738525390625, 4.3968505859375, 4.53631591796875, 4.67578125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 14.0, 22.0, 26.0, 47.0, 67.0, 91.0, 151.0, 188.0, 279.0, 434.0, 617.0, 880.0, 1399.0, 1990.0, 2922.0, 4452.0, 6413.0, 9420.0, 14091.0, 21004.0, 31705.0, 48097.0, 72919.0, 110752.0, 157423.0, 1219555.0, 131620.0, 88109.0, 57745.0, 37732.0, 25343.0, 16898.0, 11207.0, 7770.0, 5167.0, 3405.0, 2399.0, 1575.0, 1019.0, 716.0, 463.0, 334.0, 235.0, 136.0, 101.0, 73.0, 42.0, 29.0, 17.0, 16.0, 7.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.418701171875, -0.4052886962890625, -0.391876220703125, -0.3784637451171875, -0.36505126953125, -0.3516387939453125, -0.338226318359375, -0.3248138427734375, -0.3114013671875, -0.2979888916015625, -0.284576416015625, -0.2711639404296875, -0.25775146484375, -0.2443389892578125, -0.230926513671875, -0.2175140380859375, -0.2041015625, -0.1906890869140625, -0.177276611328125, -0.1638641357421875, -0.15045166015625, -0.1370391845703125, -0.123626708984375, -0.1102142333984375, -0.0968017578125, -0.0833892822265625, -0.069976806640625, -0.0565643310546875, -0.04315185546875, -0.0297393798828125, -0.016326904296875, -0.0029144287109375, 0.010498046875, 0.0239105224609375, 0.037322998046875, 0.0507354736328125, 0.06414794921875, 0.0775604248046875, 0.090972900390625, 0.1043853759765625, 0.1177978515625, 0.1312103271484375, 0.144622802734375, 0.1580352783203125, 0.17144775390625, 0.1848602294921875, 0.198272705078125, 0.2116851806640625, 0.22509765625, 0.2385101318359375, 0.251922607421875, 0.2653350830078125, 0.27874755859375, 0.2921600341796875, 0.305572509765625, 0.3189849853515625, 0.3323974609375, 0.3458099365234375, 0.359222412109375, 0.3726348876953125, 0.38604736328125, 0.3994598388671875, 0.412872314453125, 0.4262847900390625, 0.439697265625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 6.0, 6.0, 3.0, 8.0, 2.0, 15.0, 14.0, 14.0, 11.0, 23.0, 18.0, 34.0, 29.0, 22.0, 34.0, 35.0, 35.0, 37.0, 39.0, 52.0, 39.0, 53.0, 36.0, 30.0, 43.0, 44.0, 30.0, 33.0, 34.0, 37.0, 25.0, 20.0, 17.0, 25.0, 23.0, 13.0, 9.0, 14.0, 13.0, 8.0, 1.0, 5.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009455680847167969, -0.0009166374802589417, -0.0008877068758010864, -0.0008587762713432312, -0.000829845666885376, -0.0008009150624275208, -0.0007719844579696655, -0.0007430538535118103, -0.0007141232490539551, -0.0006851926445960999, -0.0006562620401382446, -0.0006273314356803894, -0.0005984008312225342, -0.000569470226764679, -0.0005405396223068237, -0.0005116090178489685, -0.0004826784133911133, -0.00045374780893325806, -0.00042481720447540283, -0.0003958866000175476, -0.0003669559955596924, -0.00033802539110183716, -0.00030909478664398193, -0.0002801641821861267, -0.0002512335777282715, -0.00022230297327041626, -0.00019337236881256104, -0.0001644417643547058, -0.00013551115989685059, -0.00010658055543899536, -7.764995098114014e-05, -4.871934652328491e-05, -1.9788742065429688e-05, 9.141862392425537e-06, 3.807246685028076e-05, 6.700307130813599e-05, 9.593367576599121e-05, 0.00012486428022384644, 0.00015379488468170166, 0.00018272548913955688, 0.0002116560935974121, 0.00024058669805526733, 0.00026951730251312256, 0.0002984479069709778, 0.000327378511428833, 0.00035630911588668823, 0.00038523972034454346, 0.0004141703248023987, 0.0004431009292602539, 0.00047203153371810913, 0.0005009621381759644, 0.0005298927426338196, 0.0005588233470916748, 0.00058775395154953, 0.0006166845560073853, 0.0006456151604652405, 0.0006745457649230957, 0.0007034763693809509, 0.0007324069738388062, 0.0007613375782966614, 0.0007902681827545166, 0.0008191987872123718, 0.000848129391670227, 0.0008770599961280823, 0.0009059906005859375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 12.0, 20.0, 19.0, 21.0, 26.0, 43.0, 48.0, 40.0, 58.0, 73.0, 95.0, 150.0, 199.0, 339.0, 469.0, 809.0, 3201.0, 374313.0, 660854.0, 5094.0, 908.0, 503.0, 317.0, 228.0, 136.0, 119.0, 92.0, 74.0, 61.0, 37.0, 36.0, 28.0, 22.0, 19.0, 20.0, 8.0, 9.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.019439697265625, -0.01885199546813965, -0.018264293670654297, -0.017676591873168945, -0.017088890075683594, -0.016501188278198242, -0.01591348648071289, -0.015325784683227539, -0.014738082885742188, -0.014150381088256836, -0.013562679290771484, -0.012974977493286133, -0.012387275695800781, -0.01179957389831543, -0.011211872100830078, -0.010624170303344727, -0.010036468505859375, -0.009448766708374023, -0.008861064910888672, -0.00827336311340332, -0.007685661315917969, -0.007097959518432617, -0.006510257720947266, -0.005922555923461914, -0.0053348541259765625, -0.004747152328491211, -0.004159450531005859, -0.003571748733520508, -0.0029840469360351562, -0.0023963451385498047, -0.0018086433410644531, -0.0012209415435791016, -0.00063323974609375, -4.553794860839844e-05, 0.0005421638488769531, 0.0011298656463623047, 0.0017175674438476562, 0.002305269241333008, 0.0028929710388183594, 0.003480672836303711, 0.0040683746337890625, 0.004656076431274414, 0.005243778228759766, 0.005831480026245117, 0.006419181823730469, 0.00700688362121582, 0.007594585418701172, 0.008182287216186523, 0.008769989013671875, 0.009357690811157227, 0.009945392608642578, 0.01053309440612793, 0.011120796203613281, 0.011708498001098633, 0.012296199798583984, 0.012883901596069336, 0.013471603393554688, 0.014059305191040039, 0.01464700698852539, 0.015234708786010742, 0.015822410583496094, 0.016410112380981445, 0.016997814178466797, 0.01758551597595215, 0.0181732177734375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 44.0, 737.0, 235.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006766138132661581, -0.006522041745483875, -0.006277945823967457, -0.006033849436789751, -0.005789753515273333, -0.005545657128095627, -0.005301561206579208, -0.005057464819401503, -0.004813368432223797, -0.004569272045046091, -0.004325176123529673, -0.004081079736351967, -0.0038369838148355484, -0.0035928874276578426, -0.0033487912733107805, -0.0031046951189637184, -0.0028605991974473, -0.002616503043100238, -0.0023724068887531757, -0.00212831050157547, -0.0018842144636437297, -0.0016401183092966676, -0.0013960220385342836, -0.0011519258841872215, -0.0009078297298401594, -0.0006637335754930973, -0.0004196373629383743, -0.00017554115038365126, 6.855500396341085e-05, 0.00031265115831047297, 0.0005567474290728569, 0.000800843583419919, 0.0010449392721056938, 0.001289035426452756, 0.001533131580799818, 0.001777227851562202, 0.0020213238894939423, 0.002265420276671648, 0.00250951643101871, 0.0027536125853657722, 0.0029977087397128344, 0.0032418048940598965, 0.0034859010484069586, 0.0037299972027540207, 0.0039740935899317265, 0.004218189511448145, 0.004462285898625851, 0.004706381820142269, 0.004950478207319975, 0.005194574594497681, 0.005438670516014099, 0.005682766903191805, 0.005926862824708223, 0.006170959211885929, 0.0064150551334023476, 0.006659151520580053, 0.006903247907757759, 0.007147344294935465, 0.007391440216451883, 0.007635536603629589, 0.007879632525146008, 0.008123728446662426, 0.008367825299501419, 0.008611921221017838, 0.008856017142534256]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 8.0, 9.0, 4.0, 6.0, 6.0, 14.0, 10.0, 9.0, 16.0, 12.0, 21.0, 16.0, 26.0, 24.0, 34.0, 32.0, 29.0, 26.0, 30.0, 35.0, 36.0, 39.0, 32.0, 29.0, 40.0, 33.0, 35.0, 33.0, 37.0, 26.0, 30.0, 18.0, 28.0, 31.0, 24.0, 19.0, 17.0, 21.0, 12.0, 12.0, 14.0, 10.0, 13.0, 9.0, 4.0, 6.0, 7.0, 6.0, 7.0, 1.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.0005356669425964355, -0.0005198512226343155, -0.0005040355026721954, -0.0004882197827100754, -0.0004724040627479553, -0.00045658834278583527, -0.0004407726228237152, -0.00042495690286159515, -0.0004091411828994751, -0.00039332546293735504, -0.000377509742975235, -0.00036169402301311493, -0.0003458783030509949, -0.0003300625830888748, -0.00031424686312675476, -0.0002984311431646347, -0.00028261542320251465, -0.0002667997032403946, -0.00025098398327827454, -0.00023516826331615448, -0.00021935254335403442, -0.00020353682339191437, -0.0001877211034297943, -0.00017190538346767426, -0.0001560896635055542, -0.00014027394354343414, -0.0001244582235813141, -0.00010864250361919403, -9.282678365707397e-05, -7.701106369495392e-05, -6.119534373283386e-05, -4.5379623770713806e-05, -2.956390380859375e-05, -1.3748183846473694e-05, 2.0675361156463623e-06, 1.788325607776642e-05, 3.3698976039886475e-05, 4.951469600200653e-05, 6.533041596412659e-05, 8.114613592624664e-05, 9.69618558883667e-05, 0.00011277757585048676, 0.0001285932958126068, 0.00014440901577472687, 0.00016022473573684692, 0.00017604045569896698, 0.00019185617566108704, 0.0002076718956232071, 0.00022348761558532715, 0.0002393033355474472, 0.00025511905550956726, 0.0002709347754716873, 0.0002867504954338074, 0.00030256621539592743, 0.0003183819353580475, 0.00033419765532016754, 0.0003500133752822876, 0.00036582909524440765, 0.0003816448152065277, 0.00039746053516864777, 0.0004132762551307678, 0.0004290919750928879, 0.00044490769505500793, 0.000460723415017128, 0.00047653913497924805]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 4.0, 8.0, 11.0, 13.0, 12.0, 19.0, 11.0, 14.0, 19.0, 21.0, 28.0, 27.0, 30.0, 30.0, 36.0, 42.0, 45.0, 34.0, 31.0, 31.0, 44.0, 37.0, 34.0, 36.0, 30.0, 41.0, 25.0, 33.0, 32.0, 27.0, 23.0, 25.0, 25.0, 25.0, 20.0, 10.0, 7.0, 7.0, 6.0, 8.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.18359375, -5.98553466796875, -5.7874755859375, -5.58941650390625, -5.391357421875, -5.19329833984375, -4.9952392578125, -4.79718017578125, -4.59912109375, -4.40106201171875, -4.2030029296875, -4.00494384765625, -3.806884765625, -3.60882568359375, -3.4107666015625, -3.21270751953125, -3.0146484375, -2.81658935546875, -2.6185302734375, -2.42047119140625, -2.222412109375, -2.02435302734375, -1.8262939453125, -1.62823486328125, -1.43017578125, -1.23211669921875, -1.0340576171875, -0.83599853515625, -0.637939453125, -0.43988037109375, -0.2418212890625, -0.04376220703125, 0.154296875, 0.35235595703125, 0.5504150390625, 0.74847412109375, 0.946533203125, 1.14459228515625, 1.3426513671875, 1.54071044921875, 1.73876953125, 1.93682861328125, 2.1348876953125, 2.33294677734375, 2.531005859375, 2.72906494140625, 2.9271240234375, 3.12518310546875, 3.3232421875, 3.52130126953125, 3.7193603515625, 3.91741943359375, 4.115478515625, 4.31353759765625, 4.5115966796875, 4.70965576171875, 4.90771484375, 5.10577392578125, 5.3038330078125, 5.50189208984375, 5.699951171875, 5.89801025390625, 6.0960693359375, 6.29412841796875, 6.4921875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 13.0, 9.0, 19.0, 24.0, 36.0, 47.0, 50.0, 68.0, 78.0, 120.0, 141.0, 185.0, 236.0, 307.0, 377.0, 522.0, 692.0, 883.0, 1114.0, 1417.0, 2095.0, 3114.0, 5982.0, 20127.0, 109253.0, 579720.0, 255513.0, 42727.0, 9911.0, 3974.0, 2446.0, 1749.0, 1313.0, 999.0, 692.0, 588.0, 467.0, 346.0, 279.0, 219.0, 152.0, 123.0, 99.0, 79.0, 56.0, 50.0, 38.0, 28.0, 19.0, 17.0, 9.0, 11.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0], "bins": [-15.3984375, -14.9132080078125, -14.427978515625, -13.9427490234375, -13.45751953125, -12.9722900390625, -12.487060546875, -12.0018310546875, -11.5166015625, -11.0313720703125, -10.546142578125, -10.0609130859375, -9.57568359375, -9.0904541015625, -8.605224609375, -8.1199951171875, -7.634765625, -7.1495361328125, -6.664306640625, -6.1790771484375, -5.69384765625, -5.2086181640625, -4.723388671875, -4.2381591796875, -3.7529296875, -3.2677001953125, -2.782470703125, -2.2972412109375, -1.81201171875, -1.3267822265625, -0.841552734375, -0.3563232421875, 0.12890625, 0.6141357421875, 1.099365234375, 1.5845947265625, 2.06982421875, 2.5550537109375, 3.040283203125, 3.5255126953125, 4.0107421875, 4.4959716796875, 4.981201171875, 5.4664306640625, 5.95166015625, 6.4368896484375, 6.922119140625, 7.4073486328125, 7.892578125, 8.3778076171875, 8.863037109375, 9.3482666015625, 9.83349609375, 10.3187255859375, 10.803955078125, 11.2891845703125, 11.7744140625, 12.2596435546875, 12.744873046875, 13.2301025390625, 13.71533203125, 14.2005615234375, 14.685791015625, 15.1710205078125, 15.65625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 4.0, 9.0, 14.0, 9.0, 8.0, 17.0, 15.0, 16.0, 21.0, 22.0, 32.0, 23.0, 43.0, 44.0, 55.0, 81.0, 138.0, 217.0, 1417.0, 220.0, 164.0, 85.0, 63.0, 46.0, 33.0, 30.0, 26.0, 21.0, 27.0, 14.0, 20.0, 15.0, 16.0, 11.0, 7.0, 9.0, 10.0, 6.0, 2.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-19.46875, -18.905029296875, -18.34130859375, -17.777587890625, -17.2138671875, -16.650146484375, -16.08642578125, -15.522705078125, -14.958984375, -14.395263671875, -13.83154296875, -13.267822265625, -12.7041015625, -12.140380859375, -11.57666015625, -11.012939453125, -10.44921875, -9.885498046875, -9.32177734375, -8.758056640625, -8.1943359375, -7.630615234375, -7.06689453125, -6.503173828125, -5.939453125, -5.375732421875, -4.81201171875, -4.248291015625, -3.6845703125, -3.120849609375, -2.55712890625, -1.993408203125, -1.4296875, -0.865966796875, -0.30224609375, 0.261474609375, 0.8251953125, 1.388916015625, 1.95263671875, 2.516357421875, 3.080078125, 3.643798828125, 4.20751953125, 4.771240234375, 5.3349609375, 5.898681640625, 6.46240234375, 7.026123046875, 7.58984375, 8.153564453125, 8.71728515625, 9.281005859375, 9.8447265625, 10.408447265625, 10.97216796875, 11.535888671875, 12.099609375, 12.663330078125, 13.22705078125, 13.790771484375, 14.3544921875, 14.918212890625, 15.48193359375, 16.045654296875, 16.609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 12.0, 9.0, 16.0, 16.0, 21.0, 28.0, 30.0, 49.0, 51.0, 68.0, 95.0, 154.0, 210.0, 370.0, 708.0, 1535.0, 5277.0, 3071567.0, 60447.0, 2543.0, 1038.0, 494.0, 282.0, 177.0, 112.0, 82.0, 71.0, 48.0, 30.0, 29.0, 18.0, 19.0, 17.0, 18.0, 13.0, 9.0, 6.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.875, -65.4306640625, -62.986328125, -60.5419921875, -58.09765625, -55.6533203125, -53.208984375, -50.7646484375, -48.3203125, -45.8759765625, -43.431640625, -40.9873046875, -38.54296875, -36.0986328125, -33.654296875, -31.2099609375, -28.765625, -26.3212890625, -23.876953125, -21.4326171875, -18.98828125, -16.5439453125, -14.099609375, -11.6552734375, -9.2109375, -6.7666015625, -4.322265625, -1.8779296875, 0.56640625, 3.0107421875, 5.455078125, 7.8994140625, 10.34375, 12.7880859375, 15.232421875, 17.6767578125, 20.12109375, 22.5654296875, 25.009765625, 27.4541015625, 29.8984375, 32.3427734375, 34.787109375, 37.2314453125, 39.67578125, 42.1201171875, 44.564453125, 47.0087890625, 49.453125, 51.8974609375, 54.341796875, 56.7861328125, 59.23046875, 61.6748046875, 64.119140625, 66.5634765625, 69.0078125, 71.4521484375, 73.896484375, 76.3408203125, 78.78515625, 81.2294921875, 83.673828125, 86.1181640625, 88.5625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 16.0, 33.0, 77.0, 178.0, 218.0, 232.0, 150.0, 71.0, 23.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.3274383544922, -155.07431030273438, -151.82119750976562, -148.5680694580078, -145.31495666503906, -142.06182861328125, -138.8087158203125, -135.5555877685547, -132.30247497558594, -129.04934692382812, -125.79623413085938, -122.5431137084961, -119.28999328613281, -116.03687286376953, -112.78375244140625, -109.53062438964844, -106.27750396728516, -103.02438354492188, -99.7712631225586, -96.51814270019531, -93.26502227783203, -90.01190185546875, -86.75877380371094, -83.50566101074219, -80.25253295898438, -76.9994125366211, -73.74629211425781, -70.49317169189453, -67.24005126953125, -63.98693084716797, -60.73380661010742, -57.48068618774414, -54.227569580078125, -50.974449157714844, -47.72132873535156, -44.46820831298828, -41.215087890625, -37.96196746826172, -34.70884323120117, -31.45572280883789, -28.20260238647461, -24.949481964111328, -21.696361541748047, -18.443239212036133, -15.190118789672852, -11.93699836730957, -8.683876037597656, -5.430755615234375, -2.1776351928710938, 1.0754857063293457, 4.328606605529785, 7.581727981567383, 10.834848403930664, 14.087968826293945, 17.34109115600586, 20.59421157836914, 23.847332000732422, 27.100452423095703, 30.353572845458984, 33.60669708251953, 36.85981750488281, 40.112937927246094, 43.366058349609375, 46.619178771972656, 49.87229919433594]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 0.0, 3.0, 8.0, 8.0, 9.0, 12.0, 5.0, 13.0, 17.0, 22.0, 24.0, 31.0, 27.0, 35.0, 34.0, 35.0, 31.0, 29.0, 52.0, 41.0, 59.0, 47.0, 40.0, 36.0, 33.0, 45.0, 27.0, 37.0, 25.0, 39.0, 22.0, 16.0, 24.0, 14.0, 24.0, 15.0, 12.0, 12.0, 13.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.20210266113281, -52.51921081542969, -50.83631896972656, -49.15342712402344, -47.47053909301758, -45.78764724731445, -44.10475540161133, -42.4218635559082, -40.73897171020508, -39.05607986450195, -37.37318801879883, -35.69029998779297, -34.007408142089844, -32.32451629638672, -30.641624450683594, -28.95873260498047, -27.275842666625977, -25.59295082092285, -23.91006088256836, -22.227169036865234, -20.54427719116211, -18.861385345458984, -17.178495407104492, -15.495603561401367, -13.812712669372559, -12.12982177734375, -10.446929931640625, -8.764039039611816, -7.08114767074585, -5.398256301879883, -3.715365409851074, -2.032473564147949, -0.3495826721191406, 1.3333085775375366, 3.016199827194214, 4.699090957641602, 6.381982326507568, 8.064873695373535, 9.747764587402344, 11.430656433105469, 13.113547325134277, 14.796438217163086, 16.47933006286621, 18.162220001220703, 19.845111846923828, 21.528003692626953, 23.210895538330078, 24.893787384033203, 26.576677322387695, 28.25956916809082, 29.942459106445312, 31.625350952148438, 33.30824279785156, 34.99113464355469, 36.67402648925781, 38.35691833496094, 40.0398063659668, 41.72269821166992, 43.40559005737305, 45.088478088378906, 46.77136993408203, 48.454261779785156, 50.13715362548828, 51.820045471191406, 53.50293731689453]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 7.0, 11.0, 17.0, 13.0, 12.0, 23.0, 15.0, 20.0, 24.0, 31.0, 24.0, 45.0, 34.0, 48.0, 43.0, 48.0, 44.0, 40.0, 51.0, 34.0, 43.0, 34.0, 31.0, 44.0, 27.0, 26.0, 30.0, 30.0, 19.0, 16.0, 9.0, 10.0, 14.0, 16.0, 10.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.59375, -7.3668212890625, -7.139892578125, -6.9129638671875, -6.68603515625, -6.4591064453125, -6.232177734375, -6.0052490234375, -5.7783203125, -5.5513916015625, -5.324462890625, -5.0975341796875, -4.87060546875, -4.6436767578125, -4.416748046875, -4.1898193359375, -3.962890625, -3.7359619140625, -3.509033203125, -3.2821044921875, -3.05517578125, -2.8282470703125, -2.601318359375, -2.3743896484375, -2.1474609375, -1.9205322265625, -1.693603515625, -1.4666748046875, -1.23974609375, -1.0128173828125, -0.785888671875, -0.5589599609375, -0.33203125, -0.1051025390625, 0.121826171875, 0.3487548828125, 0.57568359375, 0.8026123046875, 1.029541015625, 1.2564697265625, 1.4833984375, 1.7103271484375, 1.937255859375, 2.1641845703125, 2.39111328125, 2.6180419921875, 2.844970703125, 3.0718994140625, 3.298828125, 3.5257568359375, 3.752685546875, 3.9796142578125, 4.20654296875, 4.4334716796875, 4.660400390625, 4.8873291015625, 5.1142578125, 5.3411865234375, 5.568115234375, 5.7950439453125, 6.02197265625, 6.2489013671875, 6.475830078125, 6.7027587890625, 6.9296875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 7.0, 15.0, 21.0, 32.0, 41.0, 73.0, 141.0, 233.0, 500.0, 1093.0, 2816.0, 9157.0, 51339.0, 700770.0, 2783335.0, 587718.0, 44147.0, 8206.0, 2580.0, 1023.0, 453.0, 249.0, 119.0, 78.0, 41.0, 31.0, 31.0, 8.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.879638671875, -15.32177734375, -14.763916015625, -14.2060546875, -13.648193359375, -13.09033203125, -12.532470703125, -11.974609375, -11.416748046875, -10.85888671875, -10.301025390625, -9.7431640625, -9.185302734375, -8.62744140625, -8.069580078125, -7.51171875, -6.953857421875, -6.39599609375, -5.838134765625, -5.2802734375, -4.722412109375, -4.16455078125, -3.606689453125, -3.048828125, -2.490966796875, -1.93310546875, -1.375244140625, -0.8173828125, -0.259521484375, 0.29833984375, 0.856201171875, 1.4140625, 1.971923828125, 2.52978515625, 3.087646484375, 3.6455078125, 4.203369140625, 4.76123046875, 5.319091796875, 5.876953125, 6.434814453125, 6.99267578125, 7.550537109375, 8.1083984375, 8.666259765625, 9.22412109375, 9.781982421875, 10.33984375, 10.897705078125, 11.45556640625, 12.013427734375, 12.5712890625, 13.129150390625, 13.68701171875, 14.244873046875, 14.802734375, 15.360595703125, 15.91845703125, 16.476318359375, 17.0341796875, 17.592041015625, 18.14990234375, 18.707763671875, 19.265625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 26.0, 95.0, 340.0, 948.0, 1662.0, 713.0, 216.0, 60.0, 13.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.0, -59.41064453125, -57.8212890625, -56.23193359375, -54.642578125, -53.05322265625, -51.4638671875, -49.87451171875, -48.28515625, -46.69580078125, -45.1064453125, -43.51708984375, -41.927734375, -40.33837890625, -38.7490234375, -37.15966796875, -35.5703125, -33.98095703125, -32.3916015625, -30.80224609375, -29.212890625, -27.62353515625, -26.0341796875, -24.44482421875, -22.85546875, -21.26611328125, -19.6767578125, -18.08740234375, -16.498046875, -14.90869140625, -13.3193359375, -11.72998046875, -10.140625, -8.55126953125, -6.9619140625, -5.37255859375, -3.783203125, -2.19384765625, -0.6044921875, 0.98486328125, 2.57421875, 4.16357421875, 5.7529296875, 7.34228515625, 8.931640625, 10.52099609375, 12.1103515625, 13.69970703125, 15.2890625, 16.87841796875, 18.4677734375, 20.05712890625, 21.646484375, 23.23583984375, 24.8251953125, 26.41455078125, 28.00390625, 29.59326171875, 31.1826171875, 32.77197265625, 34.361328125, 35.95068359375, 37.5400390625, 39.12939453125, 40.71875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 13.0, 18.0, 78.0, 350.0, 2839.0, 4106209.0, 83254.0, 1249.0, 192.0, 58.0, 11.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.625, -87.11328125, -83.6015625, -80.08984375, -76.578125, -73.06640625, -69.5546875, -66.04296875, -62.53125, -59.01953125, -55.5078125, -51.99609375, -48.484375, -44.97265625, -41.4609375, -37.94921875, -34.4375, -30.92578125, -27.4140625, -23.90234375, -20.390625, -16.87890625, -13.3671875, -9.85546875, -6.34375, -2.83203125, 0.6796875, 4.19140625, 7.703125, 11.21484375, 14.7265625, 18.23828125, 21.75, 25.26171875, 28.7734375, 32.28515625, 35.796875, 39.30859375, 42.8203125, 46.33203125, 49.84375, 53.35546875, 56.8671875, 60.37890625, 63.890625, 67.40234375, 70.9140625, 74.42578125, 77.9375, 81.44921875, 84.9609375, 88.47265625, 91.984375, 95.49609375, 99.0078125, 102.51953125, 106.03125, 109.54296875, 113.0546875, 116.56640625, 120.078125, 123.58984375, 127.1015625, 130.61328125, 134.125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 46.0, 461.0, 457.0, 45.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.13006591796875, -279.4825134277344, -269.8349609375, -260.1874084472656, -250.53985595703125, -240.89230346679688, -231.2447509765625, -221.59719848632812, -211.94964599609375, -202.30209350585938, -192.654541015625, -183.00698852539062, -173.35943603515625, -163.71188354492188, -154.0643310546875, -144.41677856445312, -134.7692413330078, -125.12168884277344, -115.47413635253906, -105.82658386230469, -96.17903137207031, -86.53147888183594, -76.8839340209961, -67.23638153076172, -57.588829040527344, -47.94127655029297, -38.293724060058594, -28.646175384521484, -18.99862289428711, -9.351070404052734, 0.296478271484375, 9.94403076171875, 19.591583251953125, 29.2391357421875, 38.886688232421875, 48.534236907958984, 58.18178939819336, 67.829345703125, 77.47689056396484, 87.12444305419922, 96.7719955444336, 106.41954803466797, 116.06710052490234, 125.71464538574219, 135.36219787597656, 145.00975036621094, 154.6573028564453, 164.3048553466797, 173.95240783691406, 183.59996032714844, 193.2475128173828, 202.8950653076172, 212.54261779785156, 222.19017028808594, 231.83770751953125, 241.48526000976562, 251.1328125, 260.7803649902344, 270.42791748046875, 280.0754699707031, 289.7230224609375, 299.3705749511719, 309.01812744140625, 318.6656799316406, 328.313232421875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 10.0, 18.0, 16.0, 11.0, 26.0, 19.0, 32.0, 31.0, 39.0, 22.0, 45.0, 47.0, 35.0, 45.0, 51.0, 45.0, 37.0, 39.0, 41.0, 40.0, 50.0, 35.0, 27.0, 41.0, 30.0, 26.0, 24.0, 25.0, 12.0, 19.0, 9.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.79084396362305, -45.97328567504883, -44.15572738647461, -42.33816909790039, -40.52061080932617, -38.70305252075195, -36.885494232177734, -35.067935943603516, -33.2503776550293, -31.432819366455078, -29.61526107788086, -27.79770278930664, -25.980144500732422, -24.162586212158203, -22.345027923583984, -20.527469635009766, -18.709911346435547, -16.892353057861328, -15.07479476928711, -13.25723648071289, -11.439678192138672, -9.622119903564453, -7.804561614990234, -5.987003326416016, -4.169445037841797, -2.351886749267578, -0.5343284606933594, 1.2832298278808594, 3.100788116455078, 4.918346405029297, 6.735904693603516, 8.553462982177734, 10.371017456054688, 12.188575744628906, 14.006134033203125, 15.823692321777344, 17.641250610351562, 19.45880889892578, 21.2763671875, 23.09392547607422, 24.911483764648438, 26.729042053222656, 28.546600341796875, 30.364158630371094, 32.18171691894531, 33.99927520751953, 35.81683349609375, 37.63439178466797, 39.45195007324219, 41.269508361816406, 43.087066650390625, 44.904624938964844, 46.72218322753906, 48.53974151611328, 50.3572998046875, 52.17485809326172, 53.99241638183594, 55.809974670410156, 57.627532958984375, 59.445091247558594, 61.26264953613281, 63.08020782470703, 64.89776611328125, 66.71532440185547, 68.53288269042969]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 7.0, 5.0, 2.0, 10.0, 11.0, 16.0, 11.0, 21.0, 20.0, 33.0, 25.0, 31.0, 31.0, 29.0, 49.0, 54.0, 50.0, 43.0, 56.0, 44.0, 39.0, 47.0, 51.0, 48.0, 33.0, 37.0, 30.0, 25.0, 27.0, 14.0, 16.0, 21.0, 6.0, 15.0, 10.0, 10.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.325439453125, -5.12744140625, -4.929443359375, -4.7314453125, -4.533447265625, -4.33544921875, -4.137451171875, -3.939453125, -3.741455078125, -3.54345703125, -3.345458984375, -3.1474609375, -2.949462890625, -2.75146484375, -2.553466796875, -2.35546875, -2.157470703125, -1.95947265625, -1.761474609375, -1.5634765625, -1.365478515625, -1.16748046875, -0.969482421875, -0.771484375, -0.573486328125, -0.37548828125, -0.177490234375, 0.0205078125, 0.218505859375, 0.41650390625, 0.614501953125, 0.8125, 1.010498046875, 1.20849609375, 1.406494140625, 1.6044921875, 1.802490234375, 2.00048828125, 2.198486328125, 2.396484375, 2.594482421875, 2.79248046875, 2.990478515625, 3.1884765625, 3.386474609375, 3.58447265625, 3.782470703125, 3.98046875, 4.178466796875, 4.37646484375, 4.574462890625, 4.7724609375, 4.970458984375, 5.16845703125, 5.366455078125, 5.564453125, 5.762451171875, 5.96044921875, 6.158447265625, 6.3564453125, 6.554443359375, 6.75244140625, 6.950439453125, 7.1484375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 13.0, 16.0, 23.0, 38.0, 37.0, 54.0, 93.0, 154.0, 239.0, 352.0, 498.0, 744.0, 1133.0, 1758.0, 2609.0, 3940.0, 5992.0, 8986.0, 13844.0, 21539.0, 33967.0, 54452.0, 87990.0, 142932.0, 204429.0, 172586.0, 108240.0, 65649.0, 41390.0, 26180.0, 17120.0, 10896.0, 6850.0, 4706.0, 3110.0, 1970.0, 1401.0, 865.0, 552.0, 398.0, 251.0, 214.0, 103.0, 67.0, 53.0, 34.0, 24.0, 30.0, 10.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.4384765625, -0.4246482849121094, -0.41082000732421875, -0.3969917297363281, -0.3831634521484375, -0.3693351745605469, -0.35550689697265625, -0.3416786193847656, -0.327850341796875, -0.3140220642089844, -0.30019378662109375, -0.2863655090332031, -0.2725372314453125, -0.2587089538574219, -0.24488067626953125, -0.23105239868164062, -0.21722412109375, -0.20339584350585938, -0.18956756591796875, -0.17573928833007812, -0.1619110107421875, -0.14808273315429688, -0.13425445556640625, -0.12042617797851562, -0.106597900390625, -0.09276962280273438, -0.07894134521484375, -0.06511306762695312, -0.0512847900390625, -0.037456512451171875, -0.02362823486328125, -0.009799957275390625, 0.0040283203125, 0.017856597900390625, 0.03168487548828125, 0.045513153076171875, 0.0593414306640625, 0.07316970825195312, 0.08699798583984375, 0.10082626342773438, 0.114654541015625, 0.12848281860351562, 0.14231109619140625, 0.15613937377929688, 0.1699676513671875, 0.18379592895507812, 0.19762420654296875, 0.21145248413085938, 0.22528076171875, 0.23910903930664062, 0.25293731689453125, 0.2667655944824219, 0.2805938720703125, 0.2944221496582031, 0.30825042724609375, 0.3220787048339844, 0.335906982421875, 0.3497352600097656, 0.36356353759765625, 0.3773918151855469, 0.3912200927734375, 0.4050483703613281, 0.41887664794921875, 0.4327049255371094, 0.446533203125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 6.0, 9.0, 7.0, 18.0, 14.0, 13.0, 26.0, 21.0, 28.0, 25.0, 19.0, 13.0, 31.0, 26.0, 32.0, 27.0, 38.0, 36.0, 36.0, 1077.0, 34.0, 33.0, 54.0, 38.0, 37.0, 44.0, 32.0, 31.0, 23.0, 19.0, 20.0, 18.0, 16.0, 25.0, 7.0, 14.0, 12.0, 15.0, 9.0, 7.0, 1.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-3.6015625, -3.49749755859375, -3.3934326171875, -3.28936767578125, -3.185302734375, -3.08123779296875, -2.9771728515625, -2.87310791015625, -2.76904296875, -2.66497802734375, -2.5609130859375, -2.45684814453125, -2.352783203125, -2.24871826171875, -2.1446533203125, -2.04058837890625, -1.9365234375, -1.83245849609375, -1.7283935546875, -1.62432861328125, -1.520263671875, -1.41619873046875, -1.3121337890625, -1.20806884765625, -1.10400390625, -0.99993896484375, -0.8958740234375, -0.79180908203125, -0.687744140625, -0.58367919921875, -0.4796142578125, -0.37554931640625, -0.271484375, -0.16741943359375, -0.0633544921875, 0.04071044921875, 0.144775390625, 0.24884033203125, 0.3529052734375, 0.45697021484375, 0.56103515625, 0.66510009765625, 0.7691650390625, 0.87322998046875, 0.977294921875, 1.08135986328125, 1.1854248046875, 1.28948974609375, 1.3935546875, 1.49761962890625, 1.6016845703125, 1.70574951171875, 1.809814453125, 1.91387939453125, 2.0179443359375, 2.12200927734375, 2.22607421875, 2.33013916015625, 2.4342041015625, 2.53826904296875, 2.642333984375, 2.74639892578125, 2.8504638671875, 2.95452880859375, 3.05859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 7.0, 13.0, 7.0, 25.0, 24.0, 40.0, 75.0, 83.0, 128.0, 184.0, 307.0, 514.0, 726.0, 1156.0, 1791.0, 2699.0, 4138.0, 6513.0, 10119.0, 15890.0, 24559.0, 37890.0, 58809.0, 90498.0, 137906.0, 1227445.0, 160922.0, 111102.0, 72130.0, 47028.0, 30124.0, 19176.0, 12516.0, 8033.0, 5080.0, 3383.0, 2133.0, 1396.0, 843.0, 609.0, 414.0, 249.0, 153.0, 103.0, 74.0, 38.0, 33.0, 21.0, 9.0, 8.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.38671875, -0.3752555847167969, -0.36379241943359375, -0.3523292541503906, -0.3408660888671875, -0.3294029235839844, -0.31793975830078125, -0.3064765930175781, -0.295013427734375, -0.2835502624511719, -0.27208709716796875, -0.2606239318847656, -0.2491607666015625, -0.23769760131835938, -0.22623443603515625, -0.21477127075195312, -0.20330810546875, -0.19184494018554688, -0.18038177490234375, -0.16891860961914062, -0.1574554443359375, -0.14599227905273438, -0.13452911376953125, -0.12306594848632812, -0.111602783203125, -0.10013961791992188, -0.08867645263671875, -0.07721328735351562, -0.0657501220703125, -0.054286956787109375, -0.04282379150390625, -0.031360626220703125, -0.0198974609375, -0.008434295654296875, 0.00302886962890625, 0.014492034912109375, 0.0259552001953125, 0.037418365478515625, 0.04888153076171875, 0.060344696044921875, 0.071807861328125, 0.08327102661132812, 0.09473419189453125, 0.10619735717773438, 0.1176605224609375, 0.12912368774414062, 0.14058685302734375, 0.15205001831054688, 0.16351318359375, 0.17497634887695312, 0.18643951416015625, 0.19790267944335938, 0.2093658447265625, 0.22082901000976562, 0.23229217529296875, 0.24375534057617188, 0.255218505859375, 0.2666816711425781, 0.27814483642578125, 0.2896080017089844, 0.3010711669921875, 0.3125343322753906, 0.32399749755859375, 0.3354606628417969, 0.346923828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 6.0, 5.0, 4.0, 8.0, 8.0, 10.0, 24.0, 27.0, 25.0, 35.0, 32.0, 33.0, 45.0, 37.0, 50.0, 53.0, 76.0, 52.0, 55.0, 43.0, 52.0, 40.0, 44.0, 39.0, 32.0, 24.0, 27.0, 27.0, 26.0, 8.0, 12.0, 10.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00109100341796875, -0.0010564029216766357, -0.0010218024253845215, -0.0009872019290924072, -0.000952601432800293, -0.0009180009365081787, -0.0008834004402160645, -0.0008487999439239502, -0.0008141994476318359, -0.0007795989513397217, -0.0007449984550476074, -0.0007103979587554932, -0.0006757974624633789, -0.0006411969661712646, -0.0006065964698791504, -0.0005719959735870361, -0.0005373954772949219, -0.0005027949810028076, -0.00046819448471069336, -0.0004335939884185791, -0.00039899349212646484, -0.0003643929958343506, -0.00032979249954223633, -0.00029519200325012207, -0.0002605915069580078, -0.00022599101066589355, -0.0001913905143737793, -0.00015679001808166504, -0.00012218952178955078, -8.758902549743652e-05, -5.2988529205322266e-05, -1.8388032913208008e-05, 1.621246337890625e-05, 5.081295967102051e-05, 8.541345596313477e-05, 0.00012001395225524902, 0.00015461444854736328, 0.00018921494483947754, 0.0002238154411315918, 0.00025841593742370605, 0.0002930164337158203, 0.00032761693000793457, 0.00036221742630004883, 0.0003968179225921631, 0.00043141841888427734, 0.0004660189151763916, 0.0005006194114685059, 0.0005352199077606201, 0.0005698204040527344, 0.0006044209003448486, 0.0006390213966369629, 0.0006736218929290771, 0.0007082223892211914, 0.0007428228855133057, 0.0007774233818054199, 0.0008120238780975342, 0.0008466243743896484, 0.0008812248706817627, 0.000915825366973877, 0.0009504258632659912, 0.0009850263595581055, 0.0010196268558502197, 0.001054227352142334, 0.0010888278484344482, 0.0011234283447265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 10.0, 11.0, 12.0, 17.0, 17.0, 44.0, 32.0, 47.0, 70.0, 88.0, 114.0, 156.0, 250.0, 345.0, 588.0, 1007.0, 9320.0, 1020753.0, 12771.0, 1049.0, 595.0, 360.0, 244.0, 139.0, 104.0, 103.0, 83.0, 54.0, 25.0, 30.0, 18.0, 20.0, 17.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0196990966796875, -0.019074201583862305, -0.01844930648803711, -0.017824411392211914, -0.01719951629638672, -0.016574621200561523, -0.015949726104736328, -0.015324831008911133, -0.014699935913085938, -0.014075040817260742, -0.013450145721435547, -0.012825250625610352, -0.012200355529785156, -0.011575460433959961, -0.010950565338134766, -0.01032567024230957, -0.009700775146484375, -0.00907588005065918, -0.008450984954833984, -0.007826089859008789, -0.007201194763183594, -0.0065762996673583984, -0.005951404571533203, -0.005326509475708008, -0.0047016143798828125, -0.004076719284057617, -0.003451824188232422, -0.0028269290924072266, -0.0022020339965820312, -0.001577138900756836, -0.0009522438049316406, -0.0003273487091064453, 0.00029754638671875, 0.0009224414825439453, 0.0015473365783691406, 0.002172231674194336, 0.0027971267700195312, 0.0034220218658447266, 0.004046916961669922, 0.004671812057495117, 0.0052967071533203125, 0.005921602249145508, 0.006546497344970703, 0.0071713924407958984, 0.007796287536621094, 0.008421182632446289, 0.009046077728271484, 0.00967097282409668, 0.010295867919921875, 0.01092076301574707, 0.011545658111572266, 0.012170553207397461, 0.012795448303222656, 0.013420343399047852, 0.014045238494873047, 0.014670133590698242, 0.015295028686523438, 0.015919923782348633, 0.016544818878173828, 0.017169713973999023, 0.01779460906982422, 0.018419504165649414, 0.01904439926147461, 0.019669294357299805, 0.020294189453125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 14.0, 35.0, 95.0, 179.0, 251.0, 219.0, 143.0, 57.0, 13.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00028665721765719354, -0.00024328375002369285, -0.00019991029694210738, -0.0001565368438605219, -0.00011316337622702122, -6.978990859352052e-05, -2.6416470063850284e-05, 1.695699756965041e-05, 6.033046520315111e-05, 0.00010370392556069419, 0.00014707738591823727, 0.00019045083899982274, 0.00023382430663332343, 0.0002771977742668241, 0.00032057121279649436, 0.00036394468042999506, 0.00040731814806349576, 0.00045069161569699645, 0.0004940650542266667, 0.0005374385509639978, 0.0005808119894936681, 0.0006241854280233383, 0.0006675588665530086, 0.0007109323632903397, 0.0007543058600276709, 0.0007976792985573411, 0.0008410527952946723, 0.0008844262338243425, 0.0009277997305616736, 0.0009711731690913439, 0.0010145466076210141, 0.0010579200461506844, 0.0011012936010956764, 0.0011446670396253467, 0.001188040478155017, 0.001231414033100009, 0.0012747874716296792, 0.0013181609101593494, 0.0013615343486890197, 0.00140490778721869, 0.001448281342163682, 0.0014916547806933522, 0.0015350282192230225, 0.0015784017741680145, 0.0016217752126976848, 0.001665148651227355, 0.0017085220897570252, 0.0017518955282866955, 0.0017952689668163657, 0.001838642405346036, 0.0018820158438757062, 0.0019253892824053764, 0.0019687628373503685, 0.0020121363922953606, 0.002055509714409709, 0.002098883269354701, 0.0021422565914690495, 0.0021856301464140415, 0.00222900346852839, 0.002272377023473382, 0.0023157503455877304, 0.0023591239005327225, 0.0024024974554777145, 0.002445870777592063, 0.002489244332537055]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 8.0, 3.0, 8.0, 9.0, 5.0, 6.0, 7.0, 12.0, 16.0, 15.0, 24.0, 14.0, 31.0, 18.0, 24.0, 32.0, 27.0, 38.0, 36.0, 30.0, 49.0, 44.0, 48.0, 43.0, 35.0, 36.0, 42.0, 31.0, 25.0, 25.0, 32.0, 30.0, 26.0, 22.0, 21.0, 15.0, 15.0, 20.0, 12.0, 9.0, 8.0, 13.0, 12.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0005502700805664062, -0.0005331402644515038, -0.0005160104483366013, -0.0004988806322216988, -0.00048175081610679626, -0.00046462099999189377, -0.00044749118387699127, -0.0004303613677620888, -0.0004132315516471863, -0.0003961017355322838, -0.0003789719194173813, -0.0003618421033024788, -0.0003447122871875763, -0.0003275824710726738, -0.0003104526549577713, -0.0002933228388428688, -0.0002761930227279663, -0.0002590632066130638, -0.00024193339049816132, -0.00022480357438325882, -0.00020767375826835632, -0.00019054394215345383, -0.00017341412603855133, -0.00015628430992364883, -0.00013915449380874634, -0.00012202467769384384, -0.00010489486157894135, -8.776504546403885e-05, -7.063522934913635e-05, -5.3505413234233856e-05, -3.637559711933136e-05, -1.9245781004428864e-05, -2.115964889526367e-06, 1.5013851225376129e-05, 3.2143667340278625e-05, 4.927348345518112e-05, 6.640329957008362e-05, 8.353311568498611e-05, 0.00010066293179988861, 0.00011779274791479111, 0.0001349225640296936, 0.0001520523801445961, 0.0001691821962594986, 0.0001863120123744011, 0.0002034418284893036, 0.00022057164460420609, 0.00023770146071910858, 0.0002548312768340111, 0.0002719610929489136, 0.00028909090906381607, 0.00030622072517871857, 0.00032335054129362106, 0.00034048035740852356, 0.00035761017352342606, 0.00037473998963832855, 0.00039186980575323105, 0.00040899962186813354, 0.00042612943798303604, 0.00044325925409793854, 0.00046038907021284103, 0.00047751888632774353, 0.000494648702442646, 0.0005117785185575485, 0.000528908334672451, 0.0005460381507873535]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 7.0, 5.0, 2.0, 10.0, 11.0, 16.0, 11.0, 21.0, 20.0, 33.0, 25.0, 31.0, 31.0, 29.0, 49.0, 54.0, 50.0, 43.0, 56.0, 44.0, 39.0, 47.0, 51.0, 48.0, 33.0, 37.0, 30.0, 25.0, 27.0, 14.0, 16.0, 21.0, 6.0, 15.0, 10.0, 10.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.325439453125, -5.12744140625, -4.929443359375, -4.7314453125, -4.533447265625, -4.33544921875, -4.137451171875, -3.939453125, -3.741455078125, -3.54345703125, -3.345458984375, -3.1474609375, -2.949462890625, -2.75146484375, -2.553466796875, -2.35546875, -2.157470703125, -1.95947265625, -1.761474609375, -1.5634765625, -1.365478515625, -1.16748046875, -0.969482421875, -0.771484375, -0.573486328125, -0.37548828125, -0.177490234375, 0.0205078125, 0.218505859375, 0.41650390625, 0.614501953125, 0.8125, 1.010498046875, 1.20849609375, 1.406494140625, 1.6044921875, 1.802490234375, 2.00048828125, 2.198486328125, 2.396484375, 2.594482421875, 2.79248046875, 2.990478515625, 3.1884765625, 3.386474609375, 3.58447265625, 3.782470703125, 3.98046875, 4.178466796875, 4.37646484375, 4.574462890625, 4.7724609375, 4.970458984375, 5.16845703125, 5.366455078125, 5.564453125, 5.762451171875, 5.96044921875, 6.158447265625, 6.3564453125, 6.554443359375, 6.75244140625, 6.950439453125, 7.1484375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 7.0, 9.0, 13.0, 2.0, 18.0, 24.0, 29.0, 42.0, 57.0, 99.0, 112.0, 178.0, 231.0, 339.0, 509.0, 764.0, 1354.0, 2557.0, 6795.0, 27940.0, 245810.0, 657200.0, 81862.0, 13352.0, 4299.0, 1897.0, 1027.0, 602.0, 450.0, 263.0, 166.0, 155.0, 83.0, 89.0, 53.0, 53.0, 28.0, 26.0, 14.0, 17.0, 5.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.3046875, -11.898193359375, -11.49169921875, -11.085205078125, -10.6787109375, -10.272216796875, -9.86572265625, -9.459228515625, -9.052734375, -8.646240234375, -8.23974609375, -7.833251953125, -7.4267578125, -7.020263671875, -6.61376953125, -6.207275390625, -5.80078125, -5.394287109375, -4.98779296875, -4.581298828125, -4.1748046875, -3.768310546875, -3.36181640625, -2.955322265625, -2.548828125, -2.142333984375, -1.73583984375, -1.329345703125, -0.9228515625, -0.516357421875, -0.10986328125, 0.296630859375, 0.703125, 1.109619140625, 1.51611328125, 1.922607421875, 2.3291015625, 2.735595703125, 3.14208984375, 3.548583984375, 3.955078125, 4.361572265625, 4.76806640625, 5.174560546875, 5.5810546875, 5.987548828125, 6.39404296875, 6.800537109375, 7.20703125, 7.613525390625, 8.02001953125, 8.426513671875, 8.8330078125, 9.239501953125, 9.64599609375, 10.052490234375, 10.458984375, 10.865478515625, 11.27197265625, 11.678466796875, 12.0849609375, 12.491455078125, 12.89794921875, 13.304443359375, 13.7109375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 8.0, 17.0, 15.0, 18.0, 26.0, 38.0, 51.0, 60.0, 105.0, 144.0, 427.0, 1603.0, 179.0, 90.0, 70.0, 52.0, 31.0, 26.0, 20.0, 10.0, 15.0, 9.0, 5.0, 12.0, 9.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.703125, -25.71875, -24.734375, -23.75, -22.765625, -21.78125, -20.796875, -19.8125, -18.828125, -17.84375, -16.859375, -15.875, -14.890625, -13.90625, -12.921875, -11.9375, -10.953125, -9.96875, -8.984375, -8.0, -7.015625, -6.03125, -5.046875, -4.0625, -3.078125, -2.09375, -1.109375, -0.125, 0.859375, 1.84375, 2.828125, 3.8125, 4.796875, 5.78125, 6.765625, 7.75, 8.734375, 9.71875, 10.703125, 11.6875, 12.671875, 13.65625, 14.640625, 15.625, 16.609375, 17.59375, 18.578125, 19.5625, 20.546875, 21.53125, 22.515625, 23.5, 24.484375, 25.46875, 26.453125, 27.4375, 28.421875, 29.40625, 30.390625, 31.375, 32.359375, 33.34375, 34.328125, 35.3125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 7.0, 8.0, 11.0, 21.0, 28.0, 40.0, 72.0, 116.0, 168.0, 266.0, 738.0, 5074.0, 3126082.0, 11230.0, 1005.0, 355.0, 190.0, 101.0, 62.0, 45.0, 27.0, 25.0, 9.0, 11.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.4375, -73.318359375, -71.19921875, -69.080078125, -66.9609375, -64.841796875, -62.72265625, -60.603515625, -58.484375, -56.365234375, -54.24609375, -52.126953125, -50.0078125, -47.888671875, -45.76953125, -43.650390625, -41.53125, -39.412109375, -37.29296875, -35.173828125, -33.0546875, -30.935546875, -28.81640625, -26.697265625, -24.578125, -22.458984375, -20.33984375, -18.220703125, -16.1015625, -13.982421875, -11.86328125, -9.744140625, -7.625, -5.505859375, -3.38671875, -1.267578125, 0.8515625, 2.970703125, 5.08984375, 7.208984375, 9.328125, 11.447265625, 13.56640625, 15.685546875, 17.8046875, 19.923828125, 22.04296875, 24.162109375, 26.28125, 28.400390625, 30.51953125, 32.638671875, 34.7578125, 36.876953125, 38.99609375, 41.115234375, 43.234375, 45.353515625, 47.47265625, 49.591796875, 51.7109375, 53.830078125, 55.94921875, 58.068359375, 60.1875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 78.0, 825.0, 103.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.83654022216797, -55.443214416503906, -48.049888610839844, -40.65656280517578, -33.26323699951172, -25.869911193847656, -18.476585388183594, -11.083259582519531, -3.6899337768554688, 3.7033920288085938, 11.096717834472656, 18.49004364013672, 25.88336944580078, 33.276695251464844, 40.670021057128906, 48.06334686279297, 55.45667266845703, 62.849998474121094, 70.24332427978516, 77.63665008544922, 85.02997589111328, 92.42330169677734, 99.8166275024414, 107.20995330810547, 114.60327911376953, 121.9966049194336, 129.38992309570312, 136.78326416015625, 144.17657470703125, 151.56991577148438, 158.96322631835938, 166.3565673828125, 173.7498779296875, 181.14320373535156, 188.53652954101562, 195.9298553466797, 203.32318115234375, 210.7165069580078, 218.10983276367188, 225.50315856933594, 232.896484375, 240.28981018066406, 247.68313598632812, 255.0764617919922, 262.46978759765625, 269.86309814453125, 277.2564392089844, 284.6497802734375, 292.0430908203125, 299.4364013671875, 306.8297424316406, 314.22308349609375, 321.61639404296875, 329.00970458984375, 336.4030456542969, 343.79638671875, 351.189697265625, 358.5830078125, 365.9763488769531, 373.36968994140625, 380.76300048828125, 388.15631103515625, 395.5496520996094, 402.9429931640625, 410.3363037109375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 9.0, 7.0, 8.0, 8.0, 10.0, 15.0, 19.0, 25.0, 23.0, 21.0, 30.0, 36.0, 23.0, 30.0, 36.0, 29.0, 47.0, 43.0, 34.0, 42.0, 42.0, 35.0, 36.0, 43.0, 36.0, 38.0, 30.0, 25.0, 28.0, 30.0, 21.0, 16.0, 14.0, 16.0, 15.0, 8.0, 10.0, 10.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-49.26926803588867, -47.708824157714844, -46.148380279541016, -44.58793640136719, -43.027496337890625, -41.4670524597168, -39.90660858154297, -38.34616470336914, -36.78572082519531, -35.225276947021484, -33.664833068847656, -32.10438919067383, -30.543947219848633, -28.983503341674805, -27.42306137084961, -25.86261749267578, -24.302173614501953, -22.741729736328125, -21.181285858154297, -19.6208438873291, -18.060400009155273, -16.499956130981445, -14.939513206481934, -13.379070281982422, -11.818626403808594, -10.258182525634766, -8.697739601135254, -7.137296199798584, -5.576852798461914, -4.016409397125244, -2.455965995788574, -0.8955230712890625, 0.6649246215820312, 2.225368022918701, 3.785811424255371, 5.346254825592041, 6.906698226928711, 8.467142105102539, 10.02758502960205, 11.588027954101562, 13.14847183227539, 14.708915710449219, 16.269359588623047, 17.829801559448242, 19.39024543762207, 20.9506893157959, 22.511131286621094, 24.071575164794922, 25.63201904296875, 27.192462921142578, 28.752906799316406, 30.3133487701416, 31.87379264831543, 33.434234619140625, 34.99467849731445, 36.55512237548828, 38.11556625366211, 39.67601013183594, 41.236454010009766, 42.796897888183594, 44.357337951660156, 45.917781829833984, 47.47822570800781, 49.03866958618164, 50.59911346435547]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 14.0, 11.0, 13.0, 18.0, 10.0, 17.0, 18.0, 31.0, 34.0, 32.0, 41.0, 38.0, 47.0, 35.0, 62.0, 37.0, 57.0, 39.0, 49.0, 41.0, 43.0, 37.0, 27.0, 39.0, 32.0, 25.0, 24.0, 22.0, 19.0, 19.0, 8.0, 8.0, 10.0, 10.0, 4.0, 4.0, 7.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.671875, -8.4202880859375, -8.168701171875, -7.9171142578125, -7.66552734375, -7.4139404296875, -7.162353515625, -6.9107666015625, -6.6591796875, -6.4075927734375, -6.156005859375, -5.9044189453125, -5.65283203125, -5.4012451171875, -5.149658203125, -4.8980712890625, -4.646484375, -4.3948974609375, -4.143310546875, -3.8917236328125, -3.64013671875, -3.3885498046875, -3.136962890625, -2.8853759765625, -2.6337890625, -2.3822021484375, -2.130615234375, -1.8790283203125, -1.62744140625, -1.3758544921875, -1.124267578125, -0.8726806640625, -0.62109375, -0.3695068359375, -0.117919921875, 0.1336669921875, 0.38525390625, 0.6368408203125, 0.888427734375, 1.1400146484375, 1.3916015625, 1.6431884765625, 1.894775390625, 2.1463623046875, 2.39794921875, 2.6495361328125, 2.901123046875, 3.1527099609375, 3.404296875, 3.6558837890625, 3.907470703125, 4.1590576171875, 4.41064453125, 4.6622314453125, 4.913818359375, 5.1654052734375, 5.4169921875, 5.6685791015625, 5.920166015625, 6.1717529296875, 6.42333984375, 6.6749267578125, 6.926513671875, 7.1781005859375, 7.4296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 2.0, 2.0, 5.0, 7.0, 10.0, 17.0, 21.0, 26.0, 27.0, 38.0, 52.0, 88.0, 128.0, 159.0, 189.0, 275.0, 442.0, 640.0, 1103.0, 2953.0, 34420.0, 3327362.0, 812960.0, 8800.0, 1860.0, 833.0, 560.0, 371.0, 246.0, 186.0, 124.0, 88.0, 78.0, 55.0, 41.0, 27.0, 21.0, 14.0, 9.0, 12.0, 6.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0], "bins": [-47.96875, -46.6650390625, -45.361328125, -44.0576171875, -42.75390625, -41.4501953125, -40.146484375, -38.8427734375, -37.5390625, -36.2353515625, -34.931640625, -33.6279296875, -32.32421875, -31.0205078125, -29.716796875, -28.4130859375, -27.109375, -25.8056640625, -24.501953125, -23.1982421875, -21.89453125, -20.5908203125, -19.287109375, -17.9833984375, -16.6796875, -15.3759765625, -14.072265625, -12.7685546875, -11.46484375, -10.1611328125, -8.857421875, -7.5537109375, -6.25, -4.9462890625, -3.642578125, -2.3388671875, -1.03515625, 0.2685546875, 1.572265625, 2.8759765625, 4.1796875, 5.4833984375, 6.787109375, 8.0908203125, 9.39453125, 10.6982421875, 12.001953125, 13.3056640625, 14.609375, 15.9130859375, 17.216796875, 18.5205078125, 19.82421875, 21.1279296875, 22.431640625, 23.7353515625, 25.0390625, 26.3427734375, 27.646484375, 28.9501953125, 30.25390625, 31.5576171875, 32.861328125, 34.1650390625, 35.46875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 6.0, 22.0, 88.0, 368.0, 1253.0, 1512.0, 594.0, 153.0, 44.0, 17.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.36279296875, -39.0693359375, -37.77587890625, -36.482421875, -35.18896484375, -33.8955078125, -32.60205078125, -31.30859375, -30.01513671875, -28.7216796875, -27.42822265625, -26.134765625, -24.84130859375, -23.5478515625, -22.25439453125, -20.9609375, -19.66748046875, -18.3740234375, -17.08056640625, -15.787109375, -14.49365234375, -13.2001953125, -11.90673828125, -10.61328125, -9.31982421875, -8.0263671875, -6.73291015625, -5.439453125, -4.14599609375, -2.8525390625, -1.55908203125, -0.265625, 1.02783203125, 2.3212890625, 3.61474609375, 4.908203125, 6.20166015625, 7.4951171875, 8.78857421875, 10.08203125, 11.37548828125, 12.6689453125, 13.96240234375, 15.255859375, 16.54931640625, 17.8427734375, 19.13623046875, 20.4296875, 21.72314453125, 23.0166015625, 24.31005859375, 25.603515625, 26.89697265625, 28.1904296875, 29.48388671875, 30.77734375, 32.07080078125, 33.3642578125, 34.65771484375, 35.951171875, 37.24462890625, 38.5380859375, 39.83154296875, 41.125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 2.0, 3.0, 3.0, 15.0, 21.0, 38.0, 91.0, 217.0, 442.0, 1231.0, 6943.0, 1344939.0, 2828211.0, 9755.0, 1459.0, 496.0, 199.0, 104.0, 39.0, 21.0, 10.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78125, -39.4248046875, -38.068359375, -36.7119140625, -35.35546875, -33.9990234375, -32.642578125, -31.2861328125, -29.9296875, -28.5732421875, -27.216796875, -25.8603515625, -24.50390625, -23.1474609375, -21.791015625, -20.4345703125, -19.078125, -17.7216796875, -16.365234375, -15.0087890625, -13.65234375, -12.2958984375, -10.939453125, -9.5830078125, -8.2265625, -6.8701171875, -5.513671875, -4.1572265625, -2.80078125, -1.4443359375, -0.087890625, 1.2685546875, 2.625, 3.9814453125, 5.337890625, 6.6943359375, 8.05078125, 9.4072265625, 10.763671875, 12.1201171875, 13.4765625, 14.8330078125, 16.189453125, 17.5458984375, 18.90234375, 20.2587890625, 21.615234375, 22.9716796875, 24.328125, 25.6845703125, 27.041015625, 28.3974609375, 29.75390625, 31.1103515625, 32.466796875, 33.8232421875, 35.1796875, 36.5361328125, 37.892578125, 39.2490234375, 40.60546875, 41.9619140625, 43.318359375, 44.6748046875, 46.03125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 9.0, 11.0, 23.0, 27.0, 51.0, 57.0, 75.0, 83.0, 102.0, 115.0, 110.0, 90.0, 76.0, 51.0, 41.0, 29.0, 25.0, 10.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.0187759399414, -97.2203140258789, -94.42184448242188, -91.62338256835938, -88.82491302490234, -86.02645111083984, -83.22798156738281, -80.42951965332031, -77.63105773925781, -74.83259582519531, -72.03412628173828, -69.23566436767578, -66.43719482421875, -63.63873291015625, -60.840267181396484, -58.04180145263672, -55.24333572387695, -52.44486999511719, -49.64640426635742, -46.847938537597656, -44.049476623535156, -41.25101089477539, -38.452545166015625, -35.654083251953125, -32.855613708496094, -30.057147979736328, -27.258684158325195, -24.46021842956543, -21.661754608154297, -18.86328887939453, -16.064823150634766, -13.266359329223633, -10.4678955078125, -7.669430732727051, -4.870965480804443, -2.072500228881836, 0.7259645462036133, 3.5244293212890625, 6.322895050048828, 9.121358871459961, 11.919824600219727, 14.718289375305176, 17.516754150390625, 20.31521987915039, 23.113685607910156, 25.91214942932129, 28.710615158081055, 31.509078979492188, 34.30754470825195, 37.10601043701172, 39.904476165771484, 42.70294189453125, 45.50140380859375, 48.299869537353516, 51.09833526611328, 53.89679718017578, 56.69526672363281, 59.49373245239258, 62.292198181152344, 65.09066009521484, 67.88912963867188, 70.68759155273438, 73.48605346679688, 76.2845230102539, 79.0829849243164]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 11.0, 6.0, 6.0, 7.0, 8.0, 9.0, 17.0, 12.0, 22.0, 22.0, 35.0, 28.0, 33.0, 33.0, 38.0, 31.0, 34.0, 43.0, 43.0, 43.0, 44.0, 41.0, 49.0, 42.0, 45.0, 22.0, 40.0, 23.0, 33.0, 30.0, 20.0, 23.0, 19.0, 14.0, 11.0, 10.0, 11.0, 5.0, 11.0, 5.0, 9.0, 4.0, 8.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.16655349731445, -37.79261016845703, -36.418663024902344, -35.04471969604492, -33.670772552490234, -32.29682922363281, -30.922883987426758, -29.548938751220703, -28.17499351501465, -26.801048278808594, -25.42710304260254, -24.053157806396484, -22.679214477539062, -21.305267333984375, -19.931324005126953, -18.5573787689209, -17.183433532714844, -15.809488296508789, -14.435543060302734, -13.061598777770996, -11.687653541564941, -10.313708305358887, -8.939764022827148, -7.565818786621094, -6.191873550415039, -4.817928314208984, -3.443983554840088, -2.0700387954711914, -0.6960935592651367, 0.677851676940918, 2.0517959594726562, 3.425741195678711, 4.799690246582031, 6.173635482788086, 7.547580242156982, 8.921525001525879, 10.295470237731934, 11.669415473937988, 13.043359756469727, 14.417304992675781, 15.791250228881836, 17.16519546508789, 18.539140701293945, 19.9130859375, 21.287029266357422, 22.66097640991211, 24.03491973876953, 25.408864974975586, 26.78281021118164, 28.156755447387695, 29.53070068359375, 30.904644012451172, 32.27859115600586, 33.65253448486328, 35.02648162841797, 36.40042495727539, 37.77436828613281, 39.148311614990234, 40.52225875854492, 41.896202087402344, 43.27014923095703, 44.64409255981445, 46.018035888671875, 47.39198303222656, 48.76593017578125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 5.0, 7.0, 10.0, 11.0, 16.0, 16.0, 24.0, 15.0, 29.0, 30.0, 44.0, 31.0, 30.0, 38.0, 43.0, 41.0, 40.0, 46.0, 43.0, 49.0, 47.0, 42.0, 51.0, 24.0, 34.0, 25.0, 31.0, 29.0, 20.0, 14.0, 16.0, 17.0, 13.0, 11.0, 10.0, 6.0, 9.0, 9.0, 8.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -76.0126953125, -73.337890625, -70.6630859375, -67.98828125, -65.3134765625, -62.638671875, -59.9638671875, -57.2890625, -54.6142578125, -51.939453125, -49.2646484375, -46.58984375, -43.9150390625, -41.240234375, -38.5654296875, -35.890625, -33.2158203125, -30.541015625, -27.8662109375, -25.19140625, -22.5166015625, -19.841796875, -17.1669921875, -14.4921875, -11.8173828125, -9.142578125, -6.4677734375, -3.79296875, -1.1181640625, 1.556640625, 4.2314453125, 6.90625, 9.5810546875, 12.255859375, 14.9306640625, 17.60546875, 20.2802734375, 22.955078125, 25.6298828125, 28.3046875, 30.9794921875, 33.654296875, 36.3291015625, 39.00390625, 41.6787109375, 44.353515625, 47.0283203125, 49.703125, 52.3779296875, 55.052734375, 57.7275390625, 60.40234375, 63.0771484375, 65.751953125, 68.4267578125, 71.1015625, 73.7763671875, 76.451171875, 79.1259765625, 81.80078125, 84.4755859375, 87.150390625, 89.8251953125, 92.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 13.0, 15.0, 36.0, 36.0, 67.0, 108.0, 176.0, 251.0, 445.0, 620.0, 955.0, 1421.0, 2157.0, 3130.0, 4821.0, 7104.0, 10613.0, 15360.0, 23306.0, 34972.0, 52678.0, 80170.0, 122507.0, 174126.0, 169161.0, 116686.0, 76830.0, 50292.0, 33468.0, 22085.0, 14756.0, 9894.0, 6636.0, 4510.0, 3163.0, 2005.0, 1313.0, 911.0, 593.0, 429.0, 271.0, 157.0, 114.0, 82.0, 43.0, 22.0, 16.0, 11.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0], "bins": [-5.83984375, -5.66778564453125, -5.4957275390625, -5.32366943359375, -5.151611328125, -4.97955322265625, -4.8074951171875, -4.63543701171875, -4.46337890625, -4.29132080078125, -4.1192626953125, -3.94720458984375, -3.775146484375, -3.60308837890625, -3.4310302734375, -3.25897216796875, -3.0869140625, -2.91485595703125, -2.7427978515625, -2.57073974609375, -2.398681640625, -2.22662353515625, -2.0545654296875, -1.88250732421875, -1.71044921875, -1.53839111328125, -1.3663330078125, -1.19427490234375, -1.022216796875, -0.85015869140625, -0.6781005859375, -0.50604248046875, -0.333984375, -0.16192626953125, 0.0101318359375, 0.18218994140625, 0.354248046875, 0.52630615234375, 0.6983642578125, 0.87042236328125, 1.04248046875, 1.21453857421875, 1.3865966796875, 1.55865478515625, 1.730712890625, 1.90277099609375, 2.0748291015625, 2.24688720703125, 2.4189453125, 2.59100341796875, 2.7630615234375, 2.93511962890625, 3.107177734375, 3.27923583984375, 3.4512939453125, 3.62335205078125, 3.79541015625, 3.96746826171875, 4.1395263671875, 4.31158447265625, 4.483642578125, 4.65570068359375, 4.8277587890625, 4.99981689453125, 5.171875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 0.0, 1.0, 3.0, 10.0, 13.0, 13.0, 15.0, 13.0, 21.0, 19.0, 27.0, 21.0, 36.0, 45.0, 39.0, 38.0, 39.0, 50.0, 49.0, 52.0, 1075.0, 48.0, 52.0, 48.0, 42.0, 40.0, 30.0, 38.0, 27.0, 26.0, 19.0, 11.0, 13.0, 17.0, 10.0, 9.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.15625, -52.23291015625, -50.3095703125, -48.38623046875, -46.462890625, -44.53955078125, -42.6162109375, -40.69287109375, -38.76953125, -36.84619140625, -34.9228515625, -32.99951171875, -31.076171875, -29.15283203125, -27.2294921875, -25.30615234375, -23.3828125, -21.45947265625, -19.5361328125, -17.61279296875, -15.689453125, -13.76611328125, -11.8427734375, -9.91943359375, -7.99609375, -6.07275390625, -4.1494140625, -2.22607421875, -0.302734375, 1.62060546875, 3.5439453125, 5.46728515625, 7.390625, 9.31396484375, 11.2373046875, 13.16064453125, 15.083984375, 17.00732421875, 18.9306640625, 20.85400390625, 22.77734375, 24.70068359375, 26.6240234375, 28.54736328125, 30.470703125, 32.39404296875, 34.3173828125, 36.24072265625, 38.1640625, 40.08740234375, 42.0107421875, 43.93408203125, 45.857421875, 47.78076171875, 49.7041015625, 51.62744140625, 53.55078125, 55.47412109375, 57.3974609375, 59.32080078125, 61.244140625, 63.16748046875, 65.0908203125, 67.01416015625, 68.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 18.0, 14.0, 36.0, 67.0, 76.0, 100.0, 173.0, 250.0, 396.0, 606.0, 951.0, 1519.0, 2356.0, 3729.0, 5719.0, 9149.0, 14579.0, 22695.0, 36381.0, 57790.0, 92529.0, 146000.0, 1241888.0, 165937.0, 110278.0, 68265.0, 42413.0, 26499.0, 16829.0, 10809.0, 6843.0, 4324.0, 2832.0, 1712.0, 1162.0, 788.0, 487.0, 307.0, 217.0, 132.0, 102.0, 46.0, 45.0, 31.0, 18.0, 15.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.2489013671875, -5.072021484375, -4.8951416015625, -4.71826171875, -4.5413818359375, -4.364501953125, -4.1876220703125, -4.0107421875, -3.8338623046875, -3.656982421875, -3.4801025390625, -3.30322265625, -3.1263427734375, -2.949462890625, -2.7725830078125, -2.595703125, -2.4188232421875, -2.241943359375, -2.0650634765625, -1.88818359375, -1.7113037109375, -1.534423828125, -1.3575439453125, -1.1806640625, -1.0037841796875, -0.826904296875, -0.6500244140625, -0.47314453125, -0.2962646484375, -0.119384765625, 0.0574951171875, 0.234375, 0.4112548828125, 0.588134765625, 0.7650146484375, 0.94189453125, 1.1187744140625, 1.295654296875, 1.4725341796875, 1.6494140625, 1.8262939453125, 2.003173828125, 2.1800537109375, 2.35693359375, 2.5338134765625, 2.710693359375, 2.8875732421875, 3.064453125, 3.2413330078125, 3.418212890625, 3.5950927734375, 3.77197265625, 3.9488525390625, 4.125732421875, 4.3026123046875, 4.4794921875, 4.6563720703125, 4.833251953125, 5.0101318359375, 5.18701171875, 5.3638916015625, 5.540771484375, 5.7176513671875, 5.89453125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 8.0, 10.0, 14.0, 9.0, 19.0, 23.0, 25.0, 24.0, 38.0, 43.0, 52.0, 66.0, 56.0, 66.0, 75.0, 82.0, 58.0, 55.0, 45.0, 42.0, 30.0, 37.0, 19.0, 25.0, 17.0, 8.0, 10.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027374267578125, -0.02653050422668457, -0.02568674087524414, -0.02484297752380371, -0.02399921417236328, -0.02315545082092285, -0.022311687469482422, -0.021467924118041992, -0.020624160766601562, -0.019780397415161133, -0.018936634063720703, -0.018092870712280273, -0.017249107360839844, -0.016405344009399414, -0.015561580657958984, -0.014717817306518555, -0.013874053955078125, -0.013030290603637695, -0.012186527252197266, -0.011342763900756836, -0.010499000549316406, -0.009655237197875977, -0.008811473846435547, -0.007967710494995117, -0.0071239471435546875, -0.006280183792114258, -0.005436420440673828, -0.0045926570892333984, -0.0037488937377929688, -0.002905130386352539, -0.0020613670349121094, -0.0012176036834716797, -0.00037384033203125, 0.0004699230194091797, 0.0013136863708496094, 0.002157449722290039, 0.0030012130737304688, 0.0038449764251708984, 0.004688739776611328, 0.005532503128051758, 0.0063762664794921875, 0.007220029830932617, 0.008063793182373047, 0.008907556533813477, 0.009751319885253906, 0.010595083236694336, 0.011438846588134766, 0.012282609939575195, 0.013126373291015625, 0.013970136642456055, 0.014813899993896484, 0.015657663345336914, 0.016501426696777344, 0.017345190048217773, 0.018188953399658203, 0.019032716751098633, 0.019876480102539062, 0.020720243453979492, 0.021564006805419922, 0.02240777015686035, 0.02325153350830078, 0.02409529685974121, 0.02493906021118164, 0.02578282356262207, 0.0266265869140625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 7.0, 13.0, 8.0, 22.0, 16.0, 16.0, 38.0, 41.0, 63.0, 90.0, 143.0, 245.0, 367.0, 716.0, 1430.0, 3374.0, 9344.0, 33075.0, 151756.0, 510965.0, 260345.0, 53758.0, 14073.0, 4667.0, 1855.0, 805.0, 455.0, 277.0, 190.0, 96.0, 89.0, 40.0, 44.0, 32.0, 32.0, 15.0, 11.0, 11.0, 4.0, 4.0, 6.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1533203125, -0.14832115173339844, -0.14332199096679688, -0.1383228302001953, -0.13332366943359375, -0.1283245086669922, -0.12332534790039062, -0.11832618713378906, -0.1133270263671875, -0.10832786560058594, -0.10332870483398438, -0.09832954406738281, -0.09333038330078125, -0.08833122253417969, -0.08333206176757812, -0.07833290100097656, -0.073333740234375, -0.06833457946777344, -0.06333541870117188, -0.05833625793457031, -0.05333709716796875, -0.04833793640136719, -0.043338775634765625, -0.03833961486816406, -0.0333404541015625, -0.028341293334960938, -0.023342132568359375, -0.018342971801757812, -0.01334381103515625, -0.008344650268554688, -0.003345489501953125, 0.0016536712646484375, 0.00665283203125, 0.011651992797851562, 0.016651153564453125, 0.021650314331054688, 0.02664947509765625, 0.03164863586425781, 0.036647796630859375, 0.04164695739746094, 0.0466461181640625, 0.05164527893066406, 0.056644439697265625, 0.06164360046386719, 0.06664276123046875, 0.07164192199707031, 0.07664108276367188, 0.08164024353027344, 0.086639404296875, 0.09163856506347656, 0.09663772583007812, 0.10163688659667969, 0.10663604736328125, 0.11163520812988281, 0.11663436889648438, 0.12163352966308594, 0.1266326904296875, 0.13163185119628906, 0.13663101196289062, 0.1416301727294922, 0.14662933349609375, 0.1516284942626953, 0.15662765502929688, 0.16162681579589844, 0.1666259765625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 5.0, 13.0, 10.0, 18.0, 38.0, 40.0, 53.0, 89.0, 95.0, 120.0, 98.0, 79.0, 93.0, 66.0, 56.0, 39.0, 25.0, 17.0, 15.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.030228953808546066, -0.029400598257780075, -0.028572242707014084, -0.027743887156248093, -0.0269155316054821, -0.02608717605471611, -0.02525882050395012, -0.024430466815829277, -0.023602111265063286, -0.022773755714297295, -0.021945400163531303, -0.021117044612765312, -0.02028868906199932, -0.01946033537387848, -0.018631979823112488, -0.017803624272346497, -0.016975268721580505, -0.016146913170814514, -0.015318557620048523, -0.014490202069282532, -0.013661847449839115, -0.012833491899073124, -0.012005136348307133, -0.011176781728863716, -0.010348424315452576, -0.009520068764686584, -0.008691713213920593, -0.007863357663154602, -0.0070350030437111855, -0.006206647492945194, -0.005378291942179203, -0.004549936857074499, -0.0037215817719697952, -0.0028932264540344477, -0.0020648711360991, -0.001236515585333109, -0.00040816026739776134, 0.0004201950505375862, 0.0012485506013035774, 0.0020769056864082813, 0.0029052612371742725, 0.00373361655510962, 0.004561971873044968, 0.005390327423810959, 0.00621868297457695, 0.007047038059681654, 0.007875394076108932, 0.008703748695552349, 0.00953210424631834, 0.010360459797084332, 0.011188815347850323, 0.01201716996729374, 0.01284552551805973, 0.013673881068825722, 0.014502236619591713, 0.015330592170357704, 0.016158947721123695, 0.016987303271889687, 0.017815658822655678, 0.01864401437342167, 0.01947236992418766, 0.020300723612308502, 0.021129079163074493, 0.021957434713840485, 0.022785790264606476]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 8.0, 10.0, 14.0, 19.0, 26.0, 22.0, 26.0, 24.0, 35.0, 45.0, 39.0, 50.0, 37.0, 49.0, 57.0, 46.0, 45.0, 38.0, 37.0, 29.0, 43.0, 28.0, 50.0, 30.0, 22.0, 31.0, 22.0, 19.0, 16.0, 13.0, 12.0, 8.0, 2.0, 10.0, 9.0, 0.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.015018641948699951, -0.014564094133675098, -0.014109546318650246, -0.013654998503625393, -0.01320045068860054, -0.012745902873575687, -0.012291355058550835, -0.011836807243525982, -0.01138225942850113, -0.010927711613476276, -0.010473163798451424, -0.010018615983426571, -0.009564068168401718, -0.009109520353376865, -0.008654972538352013, -0.00820042472332716, -0.007745876908302307, -0.007291329093277454, -0.006836781278252602, -0.006382233463227749, -0.005927685648202896, -0.005473137833178043, -0.005018590018153191, -0.004564042203128338, -0.004109494388103485, -0.0036549465730786324, -0.0032003987580537796, -0.002745850943028927, -0.002291303128004074, -0.0018367553129792213, -0.0013822074979543686, -0.0009276596829295158, -0.0004731118679046631, -1.8564052879810333e-05, 0.0004359837621450424, 0.0008905315771698952, 0.001345079392194748, 0.0017996272072196007, 0.0022541750222444534, 0.002708722837269306, 0.003163270652294159, 0.0036178184673190117, 0.0040723662823438644, 0.004526914097368717, 0.00498146191239357, 0.005436009727418423, 0.0058905575424432755, 0.006345105357468128, 0.006799653172492981, 0.007254200987517834, 0.0077087488025426865, 0.00816329661756754, 0.008617844432592392, 0.009072392247617245, 0.009526940062642097, 0.00998148787766695, 0.010436035692691803, 0.010890583507716656, 0.011345131322741508, 0.011799679137766361, 0.012254226952791214, 0.012708774767816067, 0.01316332258284092, 0.013617870397865772, 0.014072418212890625]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 5.0, 7.0, 10.0, 11.0, 16.0, 15.0, 23.0, 16.0, 29.0, 30.0, 45.0, 30.0, 31.0, 37.0, 43.0, 40.0, 42.0, 45.0, 44.0, 45.0, 49.0, 43.0, 51.0, 25.0, 32.0, 24.0, 33.0, 30.0, 19.0, 14.0, 17.0, 16.0, 14.0, 11.0, 10.0, 6.0, 9.0, 9.0, 7.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.0751953125, -73.400390625, -70.7255859375, -68.05078125, -65.3759765625, -62.701171875, -60.0263671875, -57.3515625, -54.6767578125, -52.001953125, -49.3271484375, -46.65234375, -43.9775390625, -41.302734375, -38.6279296875, -35.953125, -33.2783203125, -30.603515625, -27.9287109375, -25.25390625, -22.5791015625, -19.904296875, -17.2294921875, -14.5546875, -11.8798828125, -9.205078125, -6.5302734375, -3.85546875, -1.1806640625, 1.494140625, 4.1689453125, 6.84375, 9.5185546875, 12.193359375, 14.8681640625, 17.54296875, 20.2177734375, 22.892578125, 25.5673828125, 28.2421875, 30.9169921875, 33.591796875, 36.2666015625, 38.94140625, 41.6162109375, 44.291015625, 46.9658203125, 49.640625, 52.3154296875, 54.990234375, 57.6650390625, 60.33984375, 63.0146484375, 65.689453125, 68.3642578125, 71.0390625, 73.7138671875, 76.388671875, 79.0634765625, 81.73828125, 84.4130859375, 87.087890625, 89.7626953125, 92.4375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 15.0, 11.0, 22.0, 18.0, 34.0, 52.0, 82.0, 113.0, 159.0, 307.0, 410.0, 751.0, 1397.0, 2874.0, 7447.0, 26316.0, 137648.0, 538870.0, 264177.0, 48254.0, 11526.0, 3884.0, 1807.0, 853.0, 530.0, 310.0, 210.0, 124.0, 99.0, 76.0, 47.0, 23.0, 17.0, 27.0, 16.0, 11.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.265625, -14.75146484375, -14.2373046875, -13.72314453125, -13.208984375, -12.69482421875, -12.1806640625, -11.66650390625, -11.15234375, -10.63818359375, -10.1240234375, -9.60986328125, -9.095703125, -8.58154296875, -8.0673828125, -7.55322265625, -7.0390625, -6.52490234375, -6.0107421875, -5.49658203125, -4.982421875, -4.46826171875, -3.9541015625, -3.43994140625, -2.92578125, -2.41162109375, -1.8974609375, -1.38330078125, -0.869140625, -0.35498046875, 0.1591796875, 0.67333984375, 1.1875, 1.70166015625, 2.2158203125, 2.72998046875, 3.244140625, 3.75830078125, 4.2724609375, 4.78662109375, 5.30078125, 5.81494140625, 6.3291015625, 6.84326171875, 7.357421875, 7.87158203125, 8.3857421875, 8.89990234375, 9.4140625, 9.92822265625, 10.4423828125, 10.95654296875, 11.470703125, 11.98486328125, 12.4990234375, 13.01318359375, 13.52734375, 14.04150390625, 14.5556640625, 15.06982421875, 15.583984375, 16.09814453125, 16.6123046875, 17.12646484375, 17.640625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 12.0, 10.0, 9.0, 11.0, 23.0, 25.0, 25.0, 42.0, 41.0, 31.0, 47.0, 63.0, 56.0, 49.0, 586.0, 1552.0, 58.0, 62.0, 48.0, 41.0, 37.0, 31.0, 32.0, 26.0, 16.0, 27.0, 13.0, 13.0, 7.0, 11.0, 7.0, 5.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-172.0, -167.0859375, -162.171875, -157.2578125, -152.34375, -147.4296875, -142.515625, -137.6015625, -132.6875, -127.7734375, -122.859375, -117.9453125, -113.03125, -108.1171875, -103.203125, -98.2890625, -93.375, -88.4609375, -83.546875, -78.6328125, -73.71875, -68.8046875, -63.890625, -58.9765625, -54.0625, -49.1484375, -44.234375, -39.3203125, -34.40625, -29.4921875, -24.578125, -19.6640625, -14.75, -9.8359375, -4.921875, -0.0078125, 4.90625, 9.8203125, 14.734375, 19.6484375, 24.5625, 29.4765625, 34.390625, 39.3046875, 44.21875, 49.1328125, 54.046875, 58.9609375, 63.875, 68.7890625, 73.703125, 78.6171875, 83.53125, 88.4453125, 93.359375, 98.2734375, 103.1875, 108.1015625, 113.015625, 117.9296875, 122.84375, 127.7578125, 132.671875, 137.5859375, 142.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 5.0, 14.0, 17.0, 15.0, 31.0, 50.0, 113.0, 153.0, 266.0, 447.0, 953.0, 2624.0, 16056.0, 2694155.0, 415267.0, 11268.0, 2246.0, 873.0, 446.0, 277.0, 146.0, 86.0, 67.0, 31.0, 26.0, 19.0, 13.0, 14.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.21875, -37.90869140625, -36.5986328125, -35.28857421875, -33.978515625, -32.66845703125, -31.3583984375, -30.04833984375, -28.73828125, -27.42822265625, -26.1181640625, -24.80810546875, -23.498046875, -22.18798828125, -20.8779296875, -19.56787109375, -18.2578125, -16.94775390625, -15.6376953125, -14.32763671875, -13.017578125, -11.70751953125, -10.3974609375, -9.08740234375, -7.77734375, -6.46728515625, -5.1572265625, -3.84716796875, -2.537109375, -1.22705078125, 0.0830078125, 1.39306640625, 2.703125, 4.01318359375, 5.3232421875, 6.63330078125, 7.943359375, 9.25341796875, 10.5634765625, 11.87353515625, 13.18359375, 14.49365234375, 15.8037109375, 17.11376953125, 18.423828125, 19.73388671875, 21.0439453125, 22.35400390625, 23.6640625, 24.97412109375, 26.2841796875, 27.59423828125, 28.904296875, 30.21435546875, 31.5244140625, 32.83447265625, 34.14453125, 35.45458984375, 36.7646484375, 38.07470703125, 39.384765625, 40.69482421875, 42.0048828125, 43.31494140625, 44.625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 17.0, 19.0, 65.0, 161.0, 297.0, 254.0, 90.0, 44.0, 14.0, 16.0, 5.0, 12.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.0509262084961, -107.7363510131836, -95.42178344726562, -83.10720825195312, -70.79263305664062, -58.478065490722656, -46.163490295410156, -33.84892272949219, -21.534347534179688, -9.219775199890137, 3.094797134399414, 15.409370422363281, 27.723941802978516, 40.03851318359375, 52.35308837890625, 64.66765594482422, 76.98223114013672, 89.29680633544922, 101.61137390136719, 113.92594909667969, 126.24052429199219, 138.55508422851562, 150.86965942382812, 163.18423461914062, 175.49880981445312, 187.81338500976562, 200.12796020507812, 212.44253540039062, 224.75709533691406, 237.07167053222656, 249.38624572753906, 261.7008056640625, 274.0154113769531, 286.3299865722656, 298.6445617675781, 310.9591369628906, 323.2737121582031, 335.5882568359375, 347.90283203125, 360.2174072265625, 372.531982421875, 384.8465576171875, 397.1611328125, 409.4757080078125, 421.790283203125, 434.1048583984375, 446.41943359375, 458.7339782714844, 471.048583984375, 483.3631591796875, 495.677734375, 507.9923095703125, 520.306884765625, 532.6214599609375, 544.93603515625, 557.2506103515625, 569.5651245117188, 581.8796997070312, 594.1942749023438, 606.5088500976562, 618.8234252929688, 631.1380004882812, 643.4525756835938, 655.7671508789062, 668.0817260742188]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 8.0, 5.0, 4.0, 8.0, 8.0, 13.0, 11.0, 12.0, 14.0, 23.0, 20.0, 24.0, 26.0, 23.0, 43.0, 44.0, 41.0, 40.0, 46.0, 59.0, 48.0, 49.0, 52.0, 43.0, 44.0, 52.0, 36.0, 25.0, 31.0, 33.0, 22.0, 17.0, 21.0, 16.0, 11.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-210.40274047851562, -204.1172332763672, -197.8317108154297, -191.54620361328125, -185.2606964111328, -178.97518920898438, -172.68966674804688, -166.40415954589844, -160.11865234375, -153.83314514160156, -147.54762268066406, -141.26211547851562, -134.9766082763672, -128.69110107421875, -122.40557861328125, -116.12007141113281, -109.83454895019531, -103.54903411865234, -97.2635269165039, -90.97801208496094, -84.6925048828125, -78.40699005126953, -72.12147521972656, -65.83596801757812, -59.550453186035156, -53.26494216918945, -46.97943115234375, -40.69391632080078, -34.40840530395508, -28.122894287109375, -21.837379455566406, -15.551868438720703, -9.266357421875, -2.9808454513549805, 3.304666519165039, 9.590179443359375, 15.875690460205078, 22.16120147705078, 28.44671630859375, 34.73222732543945, 41.017738342285156, 47.30324935913086, 53.58876037597656, 59.87427520751953, 66.1597900390625, 72.44529724121094, 78.7308120727539, 85.01632690429688, 91.30183410644531, 97.58734893798828, 103.87285614013672, 110.15837097167969, 116.44387817382812, 122.7293930053711, 129.01490783691406, 135.3004150390625, 141.5859375, 147.87144470214844, 154.15696716308594, 160.44247436523438, 166.7279815673828, 173.01348876953125, 179.29901123046875, 185.5845184326172, 191.87002563476562]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 8.0, 5.0, 14.0, 27.0, 42.0, 53.0, 68.0, 150.0, 167.0, 287.0, 464.0, 729.0, 952.0, 1486.0, 2229.0, 3194.0, 4806.0, 1016280.0, 6003.0, 3606.0, 2561.0, 1784.0, 1219.0, 851.0, 535.0, 376.0, 222.0, 141.0, 102.0, 75.0, 37.0, 21.0, 18.0, 12.0, 9.0, 6.0, 1.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-37.234500885009766, -36.1920051574707, -35.14950942993164, -34.10701370239258, -33.06451416015625, -32.02201843261719, -30.979522705078125, -29.937026977539062, -28.89453125, -27.852035522460938, -26.809539794921875, -25.76704216003418, -24.724546432495117, -23.682050704956055, -22.63955307006836, -21.597057342529297, -20.554561614990234, -19.512065887451172, -18.46957015991211, -17.427072525024414, -16.38457679748535, -15.342081069946289, -14.29958438873291, -13.257087707519531, -12.214591979980469, -11.172096252441406, -10.129599571228027, -9.087102890014648, -8.044607162475586, -7.002110958099365, -5.9596147537231445, -4.917118549346924, -3.8746185302734375, -2.832122325897217, -1.789626121520996, -0.7471299171447754, 0.2953662872314453, 1.337862491607666, 2.3803586959838867, 3.4228549003601074, 4.465351104736328, 5.507847309112549, 6.5503435134887695, 7.59283971786499, 8.635335922241211, 9.677831649780273, 10.720328330993652, 11.762825012207031, 12.805320739746094, 13.847816467285156, 14.890313148498535, 15.932809829711914, 16.975305557250977, 18.01780128479004, 19.060298919677734, 20.102794647216797, 21.14529037475586, 22.187786102294922, 23.230281829833984, 24.27277946472168, 25.315275192260742, 26.357770919799805, 27.4002685546875, 28.442764282226562, 29.485260009765625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 21.0, 50.0, 81.0, 92.0, 640.0, 51461832.0, 245.0, 70.0, 44.0, 24.0, 15.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5684.64111328125, -5508.79443359375, -5332.94775390625, -5157.10107421875, -4981.25439453125, -4805.40771484375, -4629.5615234375, -4453.71484375, -4277.8681640625, -4102.021484375, -3926.1748046875, -3750.328125, -3574.4814453125, -3398.634765625, -3222.788330078125, -3046.941650390625, -2871.0947265625, -2695.248046875, -2519.4013671875, -2343.5546875, -2167.7080078125, -1991.8614501953125, -1816.014892578125, -1640.168212890625, -1464.321533203125, -1288.474853515625, -1112.628173828125, -936.7816162109375, -760.9349365234375, -585.0882568359375, -409.24169921875, -233.39501953125, -57.548828125, 118.29782104492188, 294.14447021484375, 469.9910888671875, 645.8377685546875, 821.6844482421875, 997.531005859375, 1173.377685546875, 1349.224365234375, 1525.071044921875, 1700.917724609375, 1876.7642822265625, 2052.61083984375, 2228.45751953125, 2404.30419921875, 2580.15087890625, 2755.99755859375, 2931.84423828125, 3107.69091796875, 3283.53759765625, 3459.38427734375, 3635.23095703125, 3811.077392578125, 3986.924072265625, 4162.7705078125, 4338.6171875, 4514.4638671875, 4690.310546875, 4866.1572265625, 5042.00390625, 5217.8505859375, 5393.697265625, 5569.5439453125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 8.0, 4.0, 20.0, 19.0, 25.0, 37.0, 62.0, 81.0, 119.0, 185.0, 333.0, 509.0, 816.0, 1390.0, 2227.0, 3288.0, 5395.0, 8653.0, 14019.0, 22324.0, 36217.0, 57725.0, 92325.0, 149768.0, 243521.0, 395920.0, 2914489.0, 1355507.0, 377133.0, 232158.0, 142141.0, 88373.0, 55325.0, 34506.0, 21444.0, 13351.0, 8328.0, 5169.0, 3166.0, 1928.0, 1233.0, 727.0, 523.0, 330.0, 201.0, 131.0, 94.0, 68.0, 41.0, 31.0, 31.0, 9.0, 6.0, 7.0, 2.0, 1.0, 1.0], "bins": [-2.349609375, -2.2803955078125, -2.211181640625, -2.1419677734375, -2.07275390625, -2.0035400390625, -1.934326171875, -1.8651123046875, -1.7958984375, -1.7266845703125, -1.657470703125, -1.5882568359375, -1.51904296875, -1.4498291015625, -1.380615234375, -1.3114013671875, -1.2421875, -1.1729736328125, -1.103759765625, -1.0345458984375, -0.96533203125, -0.8961181640625, -0.826904296875, -0.7576904296875, -0.6884765625, -0.6192626953125, -0.550048828125, -0.4808349609375, -0.41162109375, -0.3424072265625, -0.273193359375, -0.2039794921875, -0.134765625, -0.0655517578125, 0.003662109375, 0.0728759765625, 0.14208984375, 0.2113037109375, 0.280517578125, 0.3497314453125, 0.4189453125, 0.4881591796875, 0.557373046875, 0.6265869140625, 0.69580078125, 0.7650146484375, 0.834228515625, 0.9034423828125, 0.97265625, 1.0418701171875, 1.111083984375, 1.1802978515625, 1.24951171875, 1.3187255859375, 1.387939453125, 1.4571533203125, 1.5263671875, 1.5955810546875, 1.664794921875, 1.7340087890625, 1.80322265625, 1.8724365234375, 1.941650390625, 2.0108642578125, 2.080078125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 9.0, 6.0, 10.0, 19.0, 12.0, 12.0, 22.0, 23.0, 22.0, 23.0, 29.0, 33.0, 36.0, 32.0, 36.0, 37.0, 41.0, 44.0, 312.0, 775.0, 59.0, 34.0, 36.0, 36.0, 45.0, 34.0, 38.0, 37.0, 32.0, 19.0, 13.0, 25.0, 10.0, 19.0, 9.0, 18.0, 7.0, 3.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-19.109375, -18.566162109375, -18.02294921875, -17.479736328125, -16.9365234375, -16.393310546875, -15.85009765625, -15.306884765625, -14.763671875, -14.220458984375, -13.67724609375, -13.134033203125, -12.5908203125, -12.047607421875, -11.50439453125, -10.961181640625, -10.41796875, -9.874755859375, -9.33154296875, -8.788330078125, -8.2451171875, -7.701904296875, -7.15869140625, -6.615478515625, -6.072265625, -5.529052734375, -4.98583984375, -4.442626953125, -3.8994140625, -3.356201171875, -2.81298828125, -2.269775390625, -1.7265625, -1.183349609375, -0.64013671875, -0.096923828125, 0.4462890625, 0.989501953125, 1.53271484375, 2.075927734375, 2.619140625, 3.162353515625, 3.70556640625, 4.248779296875, 4.7919921875, 5.335205078125, 5.87841796875, 6.421630859375, 6.96484375, 7.508056640625, 8.05126953125, 8.594482421875, 9.1376953125, 9.680908203125, 10.22412109375, 10.767333984375, 11.310546875, 11.853759765625, 12.39697265625, 12.940185546875, 13.4833984375, 14.026611328125, 14.56982421875, 15.113037109375, 15.65625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 15.0, 33.0, 20.0, 36.0, 44.0, 78.0, 101.0, 153.0, 248.0, 313.0, 526.0, 776.0, 1091.0, 1634.0, 2398.0, 3865.0, 5695.0, 8769.0, 13756.0, 21510.0, 34239.0, 54895.0, 89018.0, 147162.0, 261902.0, 520578.0, 3860624.0, 574244.0, 279260.0, 156713.0, 93887.0, 57868.0, 35918.0, 22733.0, 14482.0, 9223.0, 5883.0, 4014.0, 2454.0, 1679.0, 1137.0, 784.0, 536.0, 362.0, 235.0, 166.0, 115.0, 67.0, 65.0, 53.0, 27.0, 16.0, 18.0, 8.0, 3.0, 0.0, 6.0, 3.0], "bins": [-3.21484375, -3.1160888671875, -3.017333984375, -2.9185791015625, -2.81982421875, -2.7210693359375, -2.622314453125, -2.5235595703125, -2.4248046875, -2.3260498046875, -2.227294921875, -2.1285400390625, -2.02978515625, -1.9310302734375, -1.832275390625, -1.7335205078125, -1.634765625, -1.5360107421875, -1.437255859375, -1.3385009765625, -1.23974609375, -1.1409912109375, -1.042236328125, -0.9434814453125, -0.8447265625, -0.7459716796875, -0.647216796875, -0.5484619140625, -0.44970703125, -0.3509521484375, -0.252197265625, -0.1534423828125, -0.0546875, 0.0440673828125, 0.142822265625, 0.2415771484375, 0.34033203125, 0.4390869140625, 0.537841796875, 0.6365966796875, 0.7353515625, 0.8341064453125, 0.932861328125, 1.0316162109375, 1.13037109375, 1.2291259765625, 1.327880859375, 1.4266357421875, 1.525390625, 1.6241455078125, 1.722900390625, 1.8216552734375, 1.92041015625, 2.0191650390625, 2.117919921875, 2.2166748046875, 2.3154296875, 2.4141845703125, 2.512939453125, 2.6116943359375, 2.71044921875, 2.8092041015625, 2.907958984375, 3.0067138671875, 3.10546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 2.0, 7.0, 3.0, 6.0, 6.0, 13.0, 12.0, 12.0, 13.0, 14.0, 22.0, 24.0, 23.0, 17.0, 23.0, 28.0, 35.0, 26.0, 26.0, 37.0, 39.0, 53.0, 426.0, 630.0, 75.0, 41.0, 40.0, 37.0, 40.0, 34.0, 20.0, 33.0, 18.0, 33.0, 23.0, 22.0, 18.0, 16.0, 11.0, 16.0, 11.0, 3.0, 8.0, 8.0, 9.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.90625, -9.5882568359375, -9.270263671875, -8.9522705078125, -8.63427734375, -8.3162841796875, -7.998291015625, -7.6802978515625, -7.3623046875, -7.0443115234375, -6.726318359375, -6.4083251953125, -6.09033203125, -5.7723388671875, -5.454345703125, -5.1363525390625, -4.818359375, -4.5003662109375, -4.182373046875, -3.8643798828125, -3.54638671875, -3.2283935546875, -2.910400390625, -2.5924072265625, -2.2744140625, -1.9564208984375, -1.638427734375, -1.3204345703125, -1.00244140625, -0.6844482421875, -0.366455078125, -0.0484619140625, 0.26953125, 0.5875244140625, 0.905517578125, 1.2235107421875, 1.54150390625, 1.8594970703125, 2.177490234375, 2.4954833984375, 2.8134765625, 3.1314697265625, 3.449462890625, 3.7674560546875, 4.08544921875, 4.4034423828125, 4.721435546875, 5.0394287109375, 5.357421875, 5.6754150390625, 5.993408203125, 6.3114013671875, 6.62939453125, 6.9473876953125, 7.265380859375, 7.5833740234375, 7.9013671875, 8.2193603515625, 8.537353515625, 8.8553466796875, 9.17333984375, 9.4913330078125, 9.809326171875, 10.1273193359375, 10.4453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [5.0, 4.0, 7.0, 4.0, 3.0, 10.0, 11.0, 14.0, 21.0, 21.0, 29.0, 43.0, 53.0, 59.0, 108.0, 126.0, 150.0, 225.0, 313.0, 364.0, 488.0, 615.0, 969.0, 1255.0, 1807.0, 2703.0, 4477.0, 8403.0, 17109.0, 45463.0, 196810.0, 5861639.0, 89870.0, 28205.0, 12130.0, 6302.0, 3592.0, 2342.0, 1650.0, 1069.0, 773.0, 529.0, 404.0, 325.0, 228.0, 185.0, 130.0, 115.0, 73.0, 66.0, 42.0, 37.0, 24.0, 13.0, 8.0, 4.0, 8.0, 6.0, 2.0, 6.0, 1.0, 2.0, 3.0, 4.0], "bins": [-12.4921875, -12.0927734375, -11.693359375, -11.2939453125, -10.89453125, -10.4951171875, -10.095703125, -9.6962890625, -9.296875, -8.8974609375, -8.498046875, -8.0986328125, -7.69921875, -7.2998046875, -6.900390625, -6.5009765625, -6.1015625, -5.7021484375, -5.302734375, -4.9033203125, -4.50390625, -4.1044921875, -3.705078125, -3.3056640625, -2.90625, -2.5068359375, -2.107421875, -1.7080078125, -1.30859375, -0.9091796875, -0.509765625, -0.1103515625, 0.2890625, 0.6884765625, 1.087890625, 1.4873046875, 1.88671875, 2.2861328125, 2.685546875, 3.0849609375, 3.484375, 3.8837890625, 4.283203125, 4.6826171875, 5.08203125, 5.4814453125, 5.880859375, 6.2802734375, 6.6796875, 7.0791015625, 7.478515625, 7.8779296875, 8.27734375, 8.6767578125, 9.076171875, 9.4755859375, 9.875, 10.2744140625, 10.673828125, 11.0732421875, 11.47265625, 11.8720703125, 12.271484375, 12.6708984375, 13.0703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 13.0, 9.0, 14.0, 13.0, 15.0, 26.0, 22.0, 18.0, 21.0, 28.0, 37.0, 47.0, 56.0, 54.0, 75.0, 174.0, 646.0, 246.0, 77.0, 48.0, 44.0, 40.0, 39.0, 29.0, 37.0, 37.0, 36.0, 16.0, 15.0, 23.0, 20.0, 9.0, 7.0, 6.0, 5.0, 4.0, 7.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.05816650390625, -7.8038330078125, -7.54949951171875, -7.295166015625, -7.04083251953125, -6.7864990234375, -6.53216552734375, -6.27783203125, -6.02349853515625, -5.7691650390625, -5.51483154296875, -5.260498046875, -5.00616455078125, -4.7518310546875, -4.49749755859375, -4.2431640625, -3.98883056640625, -3.7344970703125, -3.48016357421875, -3.225830078125, -2.97149658203125, -2.7171630859375, -2.46282958984375, -2.20849609375, -1.95416259765625, -1.6998291015625, -1.44549560546875, -1.191162109375, -0.93682861328125, -0.6824951171875, -0.42816162109375, -0.173828125, 0.08050537109375, 0.3348388671875, 0.58917236328125, 0.843505859375, 1.09783935546875, 1.3521728515625, 1.60650634765625, 1.86083984375, 2.11517333984375, 2.3695068359375, 2.62384033203125, 2.878173828125, 3.13250732421875, 3.3868408203125, 3.64117431640625, 3.8955078125, 4.14984130859375, 4.4041748046875, 4.65850830078125, 4.912841796875, 5.16717529296875, 5.4215087890625, 5.67584228515625, 5.93017578125, 6.18450927734375, 6.4388427734375, 6.69317626953125, 6.947509765625, 7.20184326171875, 7.4561767578125, 7.71051025390625, 7.96484375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 8.0, 10.0, 18.0, 49.0, 97.0, 244.0, 339.0, 143.0, 46.0, 24.0, 7.0, 7.0, 9.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-47.907508850097656, -46.95437240600586, -46.00123977661133, -45.04810333251953, -44.094966888427734, -43.14183044433594, -42.188697814941406, -41.23556137084961, -40.28242492675781, -39.329288482666016, -38.376155853271484, -37.42301940917969, -36.46988296508789, -35.516746520996094, -34.56361389160156, -33.610477447509766, -32.657344818115234, -31.70421028137207, -30.751073837280273, -29.79793930053711, -28.844802856445312, -27.89166831970215, -26.938533782958984, -25.985397338867188, -25.03226089477539, -24.079126358032227, -23.12598991394043, -22.172855377197266, -21.21971893310547, -20.266584396362305, -19.31344985961914, -18.360313415527344, -17.40717887878418, -16.454044342041016, -15.500907897949219, -14.547773361206055, -13.594637870788574, -12.641502380371094, -11.688366889953613, -10.735231399536133, -9.782096862792969, -8.828961372375488, -7.875826358795166, -6.9226908683776855, -5.969555854797363, -5.016420364379883, -4.063284873962402, -3.11014986038208, -2.1570138931274414, -1.20387864112854, -0.2507432699203491, 0.7023921012878418, 1.6555273532867432, 2.6086626052856445, 3.561798095703125, 4.514933109283447, 5.468068599700928, 6.421204090118408, 7.3743391036987305, 8.327474594116211, 9.280610084533691, 10.233745574951172, 11.186880111694336, 12.140015602111816, 13.093151092529297]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 4.0, 2.0, 9.0, 10.0, 8.0, 9.0, 8.0, 14.0, 20.0, 14.0, 23.0, 17.0, 37.0, 31.0, 38.0, 39.0, 38.0, 38.0, 28.0, 45.0, 48.0, 40.0, 42.0, 48.0, 39.0, 30.0, 31.0, 30.0, 36.0, 30.0, 19.0, 22.0, 27.0, 13.0, 24.0, 10.0, 14.0, 14.0, 10.0, 10.0, 5.0, 3.0, 5.0, 2.0, 6.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.6207275390625, -9.30551815032959, -8.990309715270996, -8.675100326538086, -8.359890937805176, -8.044682502746582, -7.729473114013672, -7.41426420211792, -7.099055290222168, -6.783846378326416, -6.468636989593506, -6.153428077697754, -5.838219165802002, -5.52301025390625, -5.20780086517334, -4.892591953277588, -4.577382564544678, -4.262173652648926, -3.9469645023345947, -3.6317553520202637, -3.3165464401245117, -3.0013372898101807, -2.6861281394958496, -2.3709192276000977, -2.0557100772857666, -1.740501046180725, -1.4252920150756836, -1.1100828647613525, -0.794873833656311, -0.47966480255126953, -0.16445565223693848, 0.15075325965881348, 0.46596240997314453, 0.781171441078186, 1.0963804721832275, 1.4115896224975586, 1.7267986536026, 2.0420076847076416, 2.3572168350219727, 2.6724257469177246, 2.9876348972320557, 3.3028440475463867, 3.6180529594421387, 3.9332621097564697, 4.248471260070801, 4.563680171966553, 4.878889083862305, 5.194098472595215, 5.509307384490967, 5.824516296386719, 6.139725685119629, 6.454934597015381, 6.770143508911133, 7.085352897644043, 7.400561809539795, 7.715770721435547, 8.030980110168457, 8.346189498901367, 8.661397933959961, 8.976607322692871, 9.291816711425781, 9.607025146484375, 9.922234535217285, 10.237443923950195, 10.552652359008789]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 13.0, 27.0, 28.0, 49.0, 68.0, 151.0, 271.0, 541.0, 1061.0, 2240.0, 5626.0, 17872.0, 120686.0, 3978636.0, 45145.0, 12147.0, 4844.0, 2146.0, 1077.0, 556.0, 319.0, 212.0, 140.0, 110.0, 46.0, 64.0, 39.0, 38.0, 23.0, 16.0, 12.0, 8.0, 16.0, 8.0, 11.0, 11.0, 6.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.19584274291992188, -0.18514251708984375, -0.17444229125976562, -0.1637420654296875, -0.15304183959960938, -0.14234161376953125, -0.13164138793945312, -0.120941162109375, -0.11024093627929688, -0.09954071044921875, -0.08884048461914062, -0.0781402587890625, -0.06744003295898438, -0.05673980712890625, -0.046039581298828125, -0.03533935546875, -0.024639129638671875, -0.01393890380859375, -0.003238677978515625, 0.0074615478515625, 0.018161773681640625, 0.02886199951171875, 0.039562225341796875, 0.050262451171875, 0.060962677001953125, 0.07166290283203125, 0.08236312866210938, 0.0930633544921875, 0.10376358032226562, 0.11446380615234375, 0.12516403198242188, 0.1358642578125, 0.14656448364257812, 0.15726470947265625, 0.16796493530273438, 0.1786651611328125, 0.18936538696289062, 0.20006561279296875, 0.21076583862304688, 0.221466064453125, 0.23216629028320312, 0.24286651611328125, 0.2535667419433594, 0.2642669677734375, 0.2749671936035156, 0.28566741943359375, 0.2963676452636719, 0.30706787109375, 0.3177680969238281, 0.32846832275390625, 0.3391685485839844, 0.3498687744140625, 0.3605690002441406, 0.37126922607421875, 0.3819694519042969, 0.392669677734375, 0.4033699035644531, 0.41407012939453125, 0.4247703552246094, 0.4354705810546875, 0.4461708068847656, 0.45687103271484375, 0.4675712585449219, 0.478271484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 7.0, 9.0, 6.0, 7.0, 12.0, 18.0, 15.0, 24.0, 403.0, 408.0, 17.0, 9.0, 13.0, 8.0, 11.0, 6.0, 1.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042510986328125, -0.04099559783935547, -0.03948020935058594, -0.037964820861816406, -0.036449432373046875, -0.034934043884277344, -0.03341865539550781, -0.03190326690673828, -0.03038787841796875, -0.02887248992919922, -0.027357101440429688, -0.025841712951660156, -0.024326324462890625, -0.022810935974121094, -0.021295547485351562, -0.01978015899658203, -0.0182647705078125, -0.01674938201904297, -0.015233993530273438, -0.013718605041503906, -0.012203216552734375, -0.010687828063964844, -0.009172439575195312, -0.007657051086425781, -0.00614166259765625, -0.004626274108886719, -0.0031108856201171875, -0.0015954971313476562, -8.0108642578125e-05, 0.0014352798461914062, 0.0029506683349609375, 0.004466056823730469, 0.0059814453125, 0.007496833801269531, 0.009012222290039062, 0.010527610778808594, 0.012042999267578125, 0.013558387756347656, 0.015073776245117188, 0.01658916473388672, 0.01810455322265625, 0.01961994171142578, 0.021135330200195312, 0.022650718688964844, 0.024166107177734375, 0.025681495666503906, 0.027196884155273438, 0.02871227264404297, 0.0302276611328125, 0.03174304962158203, 0.03325843811035156, 0.034773826599121094, 0.036289215087890625, 0.037804603576660156, 0.03931999206542969, 0.04083538055419922, 0.04235076904296875, 0.04386615753173828, 0.04538154602050781, 0.046896934509277344, 0.048412322998046875, 0.049927711486816406, 0.05144309997558594, 0.05295848846435547, 0.054473876953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 9.0, 10.0, 10.0, 25.0, 25.0, 31.0, 60.0, 100.0, 141.0, 226.0, 422.0, 995.0, 2859.0, 10734.0, 58370.0, 747966.0, 3235994.0, 111936.0, 17419.0, 4184.0, 1400.0, 611.0, 341.0, 177.0, 105.0, 58.0, 26.0, 19.0, 6.0, 7.0, 6.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3242759704589844, -0.31505584716796875, -0.3058357238769531, -0.2966156005859375, -0.2873954772949219, -0.27817535400390625, -0.2689552307128906, -0.259735107421875, -0.2505149841308594, -0.24129486083984375, -0.23207473754882812, -0.2228546142578125, -0.21363449096679688, -0.20441436767578125, -0.19519424438476562, -0.18597412109375, -0.17675399780273438, -0.16753387451171875, -0.15831375122070312, -0.1490936279296875, -0.13987350463867188, -0.13065338134765625, -0.12143325805664062, -0.112213134765625, -0.10299301147460938, -0.09377288818359375, -0.08455276489257812, -0.0753326416015625, -0.06611251831054688, -0.05689239501953125, -0.047672271728515625, -0.0384521484375, -0.029232025146484375, -0.02001190185546875, -0.010791778564453125, -0.0015716552734375, 0.007648468017578125, 0.01686859130859375, 0.026088714599609375, 0.035308837890625, 0.044528961181640625, 0.05374908447265625, 0.06296920776367188, 0.0721893310546875, 0.08140945434570312, 0.09062957763671875, 0.09984970092773438, 0.10906982421875, 0.11828994750976562, 0.12751007080078125, 0.13673019409179688, 0.1459503173828125, 0.15517044067382812, 0.16439056396484375, 0.17361068725585938, 0.182830810546875, 0.19205093383789062, 0.20127105712890625, 0.21049118041992188, 0.2197113037109375, 0.22893142700195312, 0.23815155029296875, 0.24737167358398438, 0.256591796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 11.0, 11.0, 14.0, 19.0, 15.0, 28.0, 35.0, 53.0, 70.0, 91.0, 121.0, 135.0, 186.0, 332.0, 920.0, 935.0, 352.0, 227.0, 137.0, 109.0, 65.0, 50.0, 38.0, 25.0, 23.0, 19.0, 14.0, 8.0, 8.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.050018310546875, -0.04816579818725586, -0.04631328582763672, -0.04446077346801758, -0.04260826110839844, -0.0407557487487793, -0.038903236389160156, -0.037050724029541016, -0.035198211669921875, -0.033345699310302734, -0.031493186950683594, -0.029640674591064453, -0.027788162231445312, -0.025935649871826172, -0.02408313751220703, -0.02223062515258789, -0.02037811279296875, -0.01852560043334961, -0.01667308807373047, -0.014820575714111328, -0.012968063354492188, -0.011115550994873047, -0.009263038635253906, -0.007410526275634766, -0.005558013916015625, -0.0037055015563964844, -0.0018529891967773438, -4.76837158203125e-07, 0.0018520355224609375, 0.003704547882080078, 0.005557060241699219, 0.007409572601318359, 0.0092620849609375, 0.01111459732055664, 0.012967109680175781, 0.014819622039794922, 0.016672134399414062, 0.018524646759033203, 0.020377159118652344, 0.022229671478271484, 0.024082183837890625, 0.025934696197509766, 0.027787208557128906, 0.029639720916748047, 0.03149223327636719, 0.03334474563598633, 0.03519725799560547, 0.03704977035522461, 0.03890228271484375, 0.04075479507446289, 0.04260730743408203, 0.04445981979370117, 0.04631233215332031, 0.04816484451293945, 0.050017356872558594, 0.051869869232177734, 0.053722381591796875, 0.055574893951416016, 0.057427406311035156, 0.0592799186706543, 0.06113243103027344, 0.06298494338989258, 0.06483745574951172, 0.06668996810913086, 0.06854248046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 10.0, 30.0, 63.0, 273.0, 464.0, 133.0, 22.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265873432159424, -2.2208850383758545, -2.175896644592285, -2.130908250808716, -2.0859198570251465, -2.040931463241577, -1.9959430694580078, -1.9509546756744385, -1.9059662818908691, -1.8609778881072998, -1.8159894943237305, -1.7710011005401611, -1.7260127067565918, -1.6810243129730225, -1.6360359191894531, -1.5910475254058838, -1.5460591316223145, -1.5010707378387451, -1.4560823440551758, -1.4110939502716064, -1.366105556488037, -1.3211171627044678, -1.2761287689208984, -1.231140375137329, -1.1861518621444702, -1.1411634683609009, -1.0961750745773315, -1.0511866807937622, -1.0061982870101929, -0.9612098932266235, -0.9162214994430542, -0.8712331056594849, -0.8262446522712708, -0.7812562584877014, -0.7362678647041321, -0.6912794709205627, -0.6462910771369934, -0.6013026833534241, -0.55631422996521, -0.5113258361816406, -0.4663374722003937, -0.42134907841682434, -0.376360684633255, -0.3313722610473633, -0.28638386726379395, -0.2413954883813858, -0.19640707969665527, -0.15141868591308594, -0.1064302921295166, -0.06144189462065697, -0.016453497111797333, 0.0285349041223526, 0.07352329790592194, 0.11851169168949127, 0.1635001003742218, 0.20848849415779114, 0.2534768879413605, 0.2984652817249298, 0.34345367550849915, 0.38844209909439087, 0.4334304928779602, 0.47841888666152954, 0.5234072804450989, 0.5683956742286682, 0.6133840680122375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 6.0, 7.0, 5.0, 10.0, 4.0, 17.0, 15.0, 16.0, 18.0, 23.0, 30.0, 32.0, 34.0, 44.0, 49.0, 58.0, 33.0, 50.0, 55.0, 47.0, 51.0, 50.0, 42.0, 41.0, 42.0, 35.0, 27.0, 26.0, 29.0, 25.0, 16.0, 14.0, 13.0, 10.0, 10.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2884256839752197, -0.27962765097618103, -0.27082961797714233, -0.26203158497810364, -0.25323355197906494, -0.24443553388118744, -0.23563751578330994, -0.22683948278427124, -0.21804144978523254, -0.20924341678619385, -0.20044538378715515, -0.19164736568927765, -0.18284933269023895, -0.17405129969120026, -0.16525328159332275, -0.15645524859428406, -0.14765721559524536, -0.13885918259620667, -0.13006114959716797, -0.12126313149929047, -0.11246509850025177, -0.10366706550121307, -0.09486903995275497, -0.08607101440429688, -0.07727298140525818, -0.06847494840621948, -0.05967692285776138, -0.050878893584012985, -0.04208086431026459, -0.03328283503651619, -0.024484805762767792, -0.015686776489019394, -0.006888747215270996, 0.0019092820584774017, 0.0107073113322258, 0.019505340605974197, 0.028303369879722595, 0.03710139915347099, 0.04589942842721939, 0.05469745770096779, 0.06349548697471619, 0.07229351997375488, 0.08109154552221298, 0.08988957107067108, 0.09868760406970978, 0.10748563706874847, 0.11628366261720657, 0.12508168816566467, 0.13387972116470337, 0.14267775416374207, 0.15147578716278076, 0.16027380526065826, 0.16907183825969696, 0.17786987125873566, 0.18666788935661316, 0.19546592235565186, 0.20426395535469055, 0.21306198835372925, 0.22186002135276794, 0.23065803945064545, 0.23945607244968414, 0.24825410544872284, 0.25705212354660034, 0.26585015654563904, 0.27464818954467773]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 9.0, 16.0, 20.0, 24.0, 28.0, 41.0, 61.0, 94.0, 143.0, 182.0, 276.0, 430.0, 718.0, 1127.0, 1895.0, 3165.0, 5632.0, 10712.0, 24717.0, 239072.0, 698539.0, 32921.0, 12953.0, 6490.0, 3557.0, 2062.0, 1282.0, 809.0, 495.0, 333.0, 238.0, 148.0, 102.0, 73.0, 49.0, 47.0, 33.0, 13.0, 15.0, 6.0, 9.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.235595703125, -0.22869110107421875, -0.2217864990234375, -0.21488189697265625, -0.207977294921875, -0.20107269287109375, -0.1941680908203125, -0.18726348876953125, -0.18035888671875, -0.17345428466796875, -0.1665496826171875, -0.15964508056640625, -0.152740478515625, -0.14583587646484375, -0.1389312744140625, -0.13202667236328125, -0.1251220703125, -0.11821746826171875, -0.1113128662109375, -0.10440826416015625, -0.097503662109375, -0.09059906005859375, -0.0836944580078125, -0.07678985595703125, -0.06988525390625, -0.06298065185546875, -0.0560760498046875, -0.04917144775390625, -0.042266845703125, -0.03536224365234375, -0.0284576416015625, -0.02155303955078125, -0.0146484375, -0.00774383544921875, -0.0008392333984375, 0.00606536865234375, 0.012969970703125, 0.01987457275390625, 0.0267791748046875, 0.03368377685546875, 0.04058837890625, 0.04749298095703125, 0.0543975830078125, 0.06130218505859375, 0.068206787109375, 0.07511138916015625, 0.0820159912109375, 0.08892059326171875, 0.0958251953125, 0.10272979736328125, 0.1096343994140625, 0.11653900146484375, 0.123443603515625, 0.13034820556640625, 0.1372528076171875, 0.14415740966796875, 0.15106201171875, 0.15796661376953125, 0.1648712158203125, 0.17177581787109375, 0.178680419921875, 0.18558502197265625, 0.1924896240234375, 0.19939422607421875, 0.206298828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 13.0, 4.0, 7.0, 21.0, 36.0, 94.0, 259.0, 301.0, 126.0, 43.0, 12.0, 11.0, 5.0, 5.0, 4.0, 5.0, 4.0, 6.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0372314453125, -0.036036014556884766, -0.03484058380126953, -0.0336451530456543, -0.03244972229003906, -0.03125429153442383, -0.030058860778808594, -0.02886343002319336, -0.027667999267578125, -0.02647256851196289, -0.025277137756347656, -0.024081707000732422, -0.022886276245117188, -0.021690845489501953, -0.02049541473388672, -0.019299983978271484, -0.01810455322265625, -0.016909122467041016, -0.01571369171142578, -0.014518260955810547, -0.013322830200195312, -0.012127399444580078, -0.010931968688964844, -0.00973653793334961, -0.008541107177734375, -0.007345676422119141, -0.006150245666503906, -0.004954814910888672, -0.0037593841552734375, -0.002563953399658203, -0.0013685226440429688, -0.00017309188842773438, 0.0010223388671875, 0.0022177696228027344, 0.0034132003784179688, 0.004608631134033203, 0.0058040618896484375, 0.006999492645263672, 0.008194923400878906, 0.00939035415649414, 0.010585784912109375, 0.01178121566772461, 0.012976646423339844, 0.014172077178955078, 0.015367507934570312, 0.016562938690185547, 0.01775836944580078, 0.018953800201416016, 0.02014923095703125, 0.021344661712646484, 0.02254009246826172, 0.023735523223876953, 0.024930953979492188, 0.026126384735107422, 0.027321815490722656, 0.02851724624633789, 0.029712677001953125, 0.03090810775756836, 0.032103538513183594, 0.03329896926879883, 0.03449440002441406, 0.0356898307800293, 0.03688526153564453, 0.038080692291259766, 0.039276123046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 18.0, 15.0, 26.0, 35.0, 65.0, 117.0, 187.0, 409.0, 1077.0, 3971.0, 37585.0, 923216.0, 73859.0, 5615.0, 1309.0, 500.0, 225.0, 120.0, 72.0, 40.0, 19.0, 14.0, 14.0, 9.0, 5.0, 9.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.56591796875, -0.54541015625, -0.52490234375, -0.50439453125, -0.48388671875, -0.46337890625, -0.44287109375, -0.42236328125, -0.40185546875, -0.38134765625, -0.36083984375, -0.34033203125, -0.31982421875, -0.29931640625, -0.27880859375, -0.25830078125, -0.23779296875, -0.21728515625, -0.19677734375, -0.17626953125, -0.15576171875, -0.13525390625, -0.11474609375, -0.09423828125, -0.07373046875, -0.05322265625, -0.03271484375, -0.01220703125, 0.00830078125, 0.02880859375, 0.04931640625, 0.06982421875, 0.09033203125, 0.11083984375, 0.13134765625, 0.15185546875, 0.17236328125, 0.19287109375, 0.21337890625, 0.23388671875, 0.25439453125, 0.27490234375, 0.29541015625, 0.31591796875, 0.33642578125, 0.35693359375, 0.37744140625, 0.39794921875, 0.41845703125, 0.43896484375, 0.45947265625, 0.47998046875, 0.50048828125, 0.52099609375, 0.54150390625, 0.56201171875, 0.58251953125, 0.60302734375, 0.62353515625, 0.64404296875, 0.66455078125, 0.68505859375, 0.70556640625, 0.72607421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 11.0, 15.0, 12.0, 12.0, 24.0, 27.0, 19.0, 29.0, 32.0, 30.0, 39.0, 34.0, 41.0, 44.0, 52.0, 44.0, 34.0, 52.0, 45.0, 39.0, 35.0, 27.0, 35.0, 34.0, 26.0, 29.0, 26.0, 21.0, 19.0, 17.0, 16.0, 12.0, 8.0, 8.0, 8.0, 3.0, 7.0, 1.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1605224609375, -0.15567398071289062, -0.15082550048828125, -0.14597702026367188, -0.1411285400390625, -0.13628005981445312, -0.13143157958984375, -0.12658309936523438, -0.121734619140625, -0.11688613891601562, -0.11203765869140625, -0.10718917846679688, -0.1023406982421875, -0.09749221801757812, -0.09264373779296875, -0.08779525756835938, -0.08294677734375, -0.07809829711914062, -0.07324981689453125, -0.06840133666992188, -0.0635528564453125, -0.058704376220703125, -0.05385589599609375, -0.049007415771484375, -0.044158935546875, -0.039310455322265625, -0.03446197509765625, -0.029613494873046875, -0.0247650146484375, -0.019916534423828125, -0.01506805419921875, -0.010219573974609375, -0.00537109375, -0.000522613525390625, 0.00432586669921875, 0.009174346923828125, 0.0140228271484375, 0.018871307373046875, 0.02371978759765625, 0.028568267822265625, 0.033416748046875, 0.038265228271484375, 0.04311370849609375, 0.047962188720703125, 0.0528106689453125, 0.057659149169921875, 0.06250762939453125, 0.06735610961914062, 0.07220458984375, 0.07705307006835938, 0.08190155029296875, 0.08675003051757812, 0.0915985107421875, 0.09644699096679688, 0.10129547119140625, 0.10614395141601562, 0.110992431640625, 0.11584091186523438, 0.12068939208984375, 0.12553787231445312, 0.1303863525390625, 0.13523483276367188, 0.14008331298828125, 0.14493179321289062, 0.1497802734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 9.0, 9.0, 19.0, 21.0, 33.0, 39.0, 68.0, 118.0, 150.0, 275.0, 580.0, 1204.0, 3240.0, 13415.0, 339894.0, 666043.0, 16954.0, 3655.0, 1346.0, 610.0, 329.0, 197.0, 123.0, 67.0, 31.0, 30.0, 18.0, 13.0, 15.0, 10.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.404296875, -0.3912811279296875, -0.378265380859375, -0.3652496337890625, -0.35223388671875, -0.3392181396484375, -0.326202392578125, -0.3131866455078125, -0.3001708984375, -0.2871551513671875, -0.274139404296875, -0.2611236572265625, -0.24810791015625, -0.2350921630859375, -0.222076416015625, -0.2090606689453125, -0.196044921875, -0.1830291748046875, -0.170013427734375, -0.1569976806640625, -0.14398193359375, -0.1309661865234375, -0.117950439453125, -0.1049346923828125, -0.0919189453125, -0.0789031982421875, -0.065887451171875, -0.0528717041015625, -0.03985595703125, -0.0268402099609375, -0.013824462890625, -0.0008087158203125, 0.01220703125, 0.0252227783203125, 0.038238525390625, 0.0512542724609375, 0.06427001953125, 0.0772857666015625, 0.090301513671875, 0.1033172607421875, 0.1163330078125, 0.1293487548828125, 0.142364501953125, 0.1553802490234375, 0.16839599609375, 0.1814117431640625, 0.194427490234375, 0.2074432373046875, 0.220458984375, 0.2334747314453125, 0.246490478515625, 0.2595062255859375, 0.27252197265625, 0.2855377197265625, 0.298553466796875, 0.3115692138671875, 0.3245849609375, 0.3376007080078125, 0.350616455078125, 0.3636322021484375, 0.37664794921875, 0.3896636962890625, 0.402679443359375, 0.4156951904296875, 0.4287109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 5.0, 4.0, 8.0, 7.0, 15.0, 27.0, 38.0, 39.0, 67.0, 84.0, 141.0, 137.0, 113.0, 79.0, 58.0, 49.0, 21.0, 18.0, 22.0, 11.0, 10.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005664825439453125, -0.000547848641872406, -0.0005292147397994995, -0.000510580837726593, -0.0004919469356536865, -0.00047331303358078003, -0.00045467913150787354, -0.00043604522943496704, -0.00041741132736206055, -0.00039877742528915405, -0.00038014352321624756, -0.00036150962114334106, -0.00034287571907043457, -0.0003242418169975281, -0.0003056079149246216, -0.0002869740128517151, -0.0002683401107788086, -0.0002497062087059021, -0.0002310723066329956, -0.0002124384045600891, -0.00019380450248718262, -0.00017517060041427612, -0.00015653669834136963, -0.00013790279626846313, -0.00011926889419555664, -0.00010063499212265015, -8.200109004974365e-05, -6.336718797683716e-05, -4.4733285903930664e-05, -2.609938383102417e-05, -7.465481758117676e-06, 1.1168420314788818e-05, 2.9802322387695312e-05, 4.843622446060181e-05, 6.70701265335083e-05, 8.57040286064148e-05, 0.00010433793067932129, 0.00012297183275222778, 0.00014160573482513428, 0.00016023963689804077, 0.00017887353897094727, 0.00019750744104385376, 0.00021614134311676025, 0.00023477524518966675, 0.00025340914726257324, 0.00027204304933547974, 0.00029067695140838623, 0.0003093108534812927, 0.0003279447555541992, 0.0003465786576271057, 0.0003652125597000122, 0.0003838464617729187, 0.0004024803638458252, 0.0004211142659187317, 0.0004397481679916382, 0.0004583820700645447, 0.00047701597213745117, 0.0004956498742103577, 0.0005142837762832642, 0.0005329176783561707, 0.0005515515804290771, 0.0005701854825019836, 0.0005888193845748901, 0.0006074532866477966, 0.0006260871887207031]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 14.0, 19.0, 38.0, 56.0, 89.0, 168.0, 364.0, 1101.0, 3993.0, 26082.0, 671323.0, 323454.0, 17249.0, 3019.0, 849.0, 360.0, 158.0, 84.0, 46.0, 33.0, 22.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2352294921875, -0.22278785705566406, -0.21034622192382812, -0.1979045867919922, -0.18546295166015625, -0.1730213165283203, -0.16057968139648438, -0.14813804626464844, -0.1356964111328125, -0.12325477600097656, -0.11081314086914062, -0.09837150573730469, -0.08592987060546875, -0.07348823547363281, -0.061046600341796875, -0.04860496520996094, -0.036163330078125, -0.023721694946289062, -0.011280059814453125, 0.0011615753173828125, 0.01360321044921875, 0.026044845581054688, 0.038486480712890625, 0.05092811584472656, 0.0633697509765625, 0.07581138610839844, 0.08825302124023438, 0.10069465637207031, 0.11313629150390625, 0.1255779266357422, 0.13801956176757812, 0.15046119689941406, 0.16290283203125, 0.17534446716308594, 0.18778610229492188, 0.2002277374267578, 0.21266937255859375, 0.2251110076904297, 0.23755264282226562, 0.24999427795410156, 0.2624359130859375, 0.27487754821777344, 0.2873191833496094, 0.2997608184814453, 0.31220245361328125, 0.3246440887451172, 0.3370857238769531, 0.34952735900878906, 0.361968994140625, 0.37441062927246094, 0.3868522644042969, 0.3992938995361328, 0.41173553466796875, 0.4241771697998047, 0.4366188049316406, 0.44906044006347656, 0.4615020751953125, 0.47394371032714844, 0.4863853454589844, 0.4988269805908203, 0.5112686157226562, 0.5237102508544922, 0.5361518859863281, 0.5485935211181641, 0.56103515625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 11.0, 20.0, 26.0, 39.0, 54.0, 97.0, 156.0, 186.0, 131.0, 91.0, 51.0, 45.0, 21.0, 16.0, 15.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1812744140625, -0.1738414764404297, -0.16640853881835938, -0.15897560119628906, -0.15154266357421875, -0.14410972595214844, -0.13667678833007812, -0.1292438507080078, -0.1218109130859375, -0.11437797546386719, -0.10694503784179688, -0.09951210021972656, -0.09207916259765625, -0.08464622497558594, -0.07721328735351562, -0.06978034973144531, -0.062347412109375, -0.05491447448730469, -0.047481536865234375, -0.04004859924316406, -0.03261566162109375, -0.025182723999023438, -0.017749786376953125, -0.010316848754882812, -0.0028839111328125, 0.0045490264892578125, 0.011981964111328125, 0.019414901733398438, 0.02684783935546875, 0.03428077697753906, 0.041713714599609375, 0.04914665222167969, 0.05657958984375, 0.06401252746582031, 0.07144546508789062, 0.07887840270996094, 0.08631134033203125, 0.09374427795410156, 0.10117721557617188, 0.10861015319824219, 0.1160430908203125, 0.12347602844238281, 0.13090896606445312, 0.13834190368652344, 0.14577484130859375, 0.15320777893066406, 0.16064071655273438, 0.1680736541748047, 0.175506591796875, 0.1829395294189453, 0.19037246704101562, 0.19780540466308594, 0.20523834228515625, 0.21267127990722656, 0.22010421752929688, 0.2275371551513672, 0.2349700927734375, 0.2424030303955078, 0.24983596801757812, 0.25726890563964844, 0.26470184326171875, 0.27213478088378906, 0.2795677185058594, 0.2870006561279297, 0.29443359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 5.0, 10.0, 29.0, 73.0, 301.0, 395.0, 105.0, 32.0, 16.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.940474033355713, -5.80599308013916, -5.671512126922607, -5.5370306968688965, -5.402549743652344, -5.268068790435791, -5.133587837219238, -4.9991068840026855, -4.864625930786133, -4.73014497756958, -4.595664024353027, -4.461182594299316, -4.326701641082764, -4.192220687866211, -4.057739734649658, -3.9232587814331055, -3.7887773513793945, -3.654296398162842, -3.51981520652771, -3.3853342533111572, -3.2508530616760254, -3.1163721084594727, -2.98189115524292, -2.847410202026367, -2.7129290103912354, -2.5784480571746826, -2.443966865539551, -2.309485912322998, -2.1750049591064453, -2.0405237674713135, -1.9060428142547607, -1.7715617418289185, -1.6370806694030762, -1.5025995969772339, -1.3681185245513916, -1.2336375713348389, -1.0991564989089966, -0.9646754264831543, -0.8301944136619568, -0.6957134008407593, -0.561232328414917, -0.4267512857913971, -0.2922702431678772, -0.1577892005443573, -0.023308157920837402, 0.11117291450500488, 0.2456539273262024, 0.3801349401473999, 0.5146160125732422, 0.6490970849990845, 0.783578097820282, 0.9180591106414795, 1.0525401830673218, 1.187021255493164, 1.3215022087097168, 1.455983281135559, 1.5904643535614014, 1.7249454259872437, 1.859426498413086, 1.9939074516296387, 2.1283884048461914, 2.2628695964813232, 2.397350549697876, 2.531831741333008, 2.6663126945495605]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 9.0, 9.0, 10.0, 17.0, 23.0, 35.0, 58.0, 103.0, 132.0, 171.0, 144.0, 94.0, 53.0, 43.0, 17.0, 12.0, 9.0, 5.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8885433673858643, -2.7938334941864014, -2.6991233825683594, -2.6044135093688965, -2.5097036361694336, -2.4149937629699707, -2.320283889770508, -2.225573778152466, -2.130863904953003, -2.03615403175354, -1.9414440393447876, -1.8467340469360352, -1.7520241737365723, -1.6573143005371094, -1.562604308128357, -1.4678943157196045, -1.3731844425201416, -1.2784745693206787, -1.1837645769119263, -1.0890545845031738, -0.9943447113037109, -0.8996347784996033, -0.8049248456954956, -0.7102149128913879, -0.6155049800872803, -0.5207950472831726, -0.42608511447906494, -0.3313751816749573, -0.2366652488708496, -0.14195531606674194, -0.04724538326263428, 0.04746454954147339, 0.14217472076416016, 0.23688465356826782, 0.3315945863723755, 0.42630451917648315, 0.5210144519805908, 0.6157243847846985, 0.7104343175888062, 0.8051442503929138, 0.8998541831970215, 0.9945641160011292, 1.0892740488052368, 1.1839840412139893, 1.2786939144134521, 1.373403787612915, 1.4681137800216675, 1.56282377243042, 1.6575336456298828, 1.7522435188293457, 1.8469535112380981, 1.9416635036468506, 2.0363733768463135, 2.1310832500457764, 2.2257933616638184, 2.3205032348632812, 2.415213108062744, 2.509922981262207, 2.60463285446167, 2.699342966079712, 2.794052839279175, 2.8887627124786377, 2.9834728240966797, 3.0781826972961426, 3.1728925704956055]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 7.0, 13.0, 12.0, 15.0, 20.0, 31.0, 23.0, 80.0, 393.0, 7879.0, 4106897.0, 76392.0, 2050.0, 260.0, 71.0, 34.0, 16.0, 22.0, 10.0, 9.0, 8.0, 2.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.86639404296875, -1.7991943359375, -1.73199462890625, -1.664794921875, -1.59759521484375, -1.5303955078125, -1.46319580078125, -1.39599609375, -1.32879638671875, -1.2615966796875, -1.19439697265625, -1.127197265625, -1.05999755859375, -0.9927978515625, -0.92559814453125, -0.8583984375, -0.79119873046875, -0.7239990234375, -0.65679931640625, -0.589599609375, -0.52239990234375, -0.4552001953125, -0.38800048828125, -0.32080078125, -0.25360107421875, -0.1864013671875, -0.11920166015625, -0.052001953125, 0.01519775390625, 0.0823974609375, 0.14959716796875, 0.216796875, 0.28399658203125, 0.3511962890625, 0.41839599609375, 0.485595703125, 0.55279541015625, 0.6199951171875, 0.68719482421875, 0.75439453125, 0.82159423828125, 0.8887939453125, 0.95599365234375, 1.023193359375, 1.09039306640625, 1.1575927734375, 1.22479248046875, 1.2919921875, 1.35919189453125, 1.4263916015625, 1.49359130859375, 1.560791015625, 1.62799072265625, 1.6951904296875, 1.76239013671875, 1.82958984375, 1.89678955078125, 1.9639892578125, 2.03118896484375, 2.098388671875, 2.16558837890625, 2.2327880859375, 2.29998779296875, 2.3671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 10.0, 9.0, 5.0, 11.0, 13.0, 25.0, 35.0, 59.0, 122.0, 129.0, 149.0, 126.0, 102.0, 59.0, 31.0, 21.0, 8.0, 10.0, 7.0, 6.0, 13.0, 2.0, 4.0, 6.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0214691162109375, -0.020688533782958984, -0.01990795135498047, -0.019127368927001953, -0.018346786499023438, -0.017566204071044922, -0.016785621643066406, -0.01600503921508789, -0.015224456787109375, -0.01444387435913086, -0.013663291931152344, -0.012882709503173828, -0.012102127075195312, -0.011321544647216797, -0.010540962219238281, -0.009760379791259766, -0.00897979736328125, -0.008199214935302734, -0.007418632507324219, -0.006638050079345703, -0.0058574676513671875, -0.005076885223388672, -0.004296302795410156, -0.0035157203674316406, -0.002735137939453125, -0.0019545555114746094, -0.0011739730834960938, -0.0003933906555175781, 0.0003871917724609375, 0.0011677742004394531, 0.0019483566284179688, 0.0027289390563964844, 0.003509521484375, 0.004290103912353516, 0.005070686340332031, 0.005851268768310547, 0.0066318511962890625, 0.007412433624267578, 0.008193016052246094, 0.00897359848022461, 0.009754180908203125, 0.01053476333618164, 0.011315345764160156, 0.012095928192138672, 0.012876510620117188, 0.013657093048095703, 0.014437675476074219, 0.015218257904052734, 0.01599884033203125, 0.016779422760009766, 0.01756000518798828, 0.018340587615966797, 0.019121170043945312, 0.019901752471923828, 0.020682334899902344, 0.02146291732788086, 0.022243499755859375, 0.02302408218383789, 0.023804664611816406, 0.024585247039794922, 0.025365829467773438, 0.026146411895751953, 0.02692699432373047, 0.027707576751708984, 0.0284881591796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 12.0, 16.0, 37.0, 50.0, 82.0, 209.0, 428.0, 1089.0, 3107.0, 12992.0, 115218.0, 3926190.0, 117190.0, 12690.0, 3022.0, 990.0, 440.0, 216.0, 139.0, 68.0, 39.0, 22.0, 18.0, 9.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29833984375, -0.2812957763671875, -0.264251708984375, -0.2472076416015625, -0.23016357421875, -0.2131195068359375, -0.196075439453125, -0.1790313720703125, -0.1619873046875, -0.1449432373046875, -0.127899169921875, -0.1108551025390625, -0.09381103515625, -0.0767669677734375, -0.059722900390625, -0.0426788330078125, -0.025634765625, -0.0085906982421875, 0.008453369140625, 0.0254974365234375, 0.04254150390625, 0.0595855712890625, 0.076629638671875, 0.0936737060546875, 0.1107177734375, 0.1277618408203125, 0.144805908203125, 0.1618499755859375, 0.17889404296875, 0.1959381103515625, 0.212982177734375, 0.2300262451171875, 0.2470703125, 0.2641143798828125, 0.281158447265625, 0.2982025146484375, 0.31524658203125, 0.3322906494140625, 0.349334716796875, 0.3663787841796875, 0.3834228515625, 0.4004669189453125, 0.417510986328125, 0.4345550537109375, 0.45159912109375, 0.4686431884765625, 0.485687255859375, 0.5027313232421875, 0.519775390625, 0.5368194580078125, 0.553863525390625, 0.5709075927734375, 0.58795166015625, 0.6049957275390625, 0.622039794921875, 0.6390838623046875, 0.6561279296875, 0.6731719970703125, 0.690216064453125, 0.7072601318359375, 0.72430419921875, 0.7413482666015625, 0.758392333984375, 0.7754364013671875, 0.79248046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 8.0, 5.0, 8.0, 11.0, 18.0, 21.0, 36.0, 56.0, 76.0, 135.0, 297.0, 1446.0, 1337.0, 308.0, 101.0, 79.0, 32.0, 26.0, 16.0, 13.0, 10.0, 5.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.050295352935791016, -0.04855823516845703, -0.04682111740112305, -0.04508399963378906, -0.04334688186645508, -0.041609764099121094, -0.03987264633178711, -0.038135528564453125, -0.03639841079711914, -0.034661293029785156, -0.03292417526245117, -0.031187057495117188, -0.029449939727783203, -0.02771282196044922, -0.025975704193115234, -0.02423858642578125, -0.022501468658447266, -0.02076435089111328, -0.019027233123779297, -0.017290115356445312, -0.015552997589111328, -0.013815879821777344, -0.01207876205444336, -0.010341644287109375, -0.00860452651977539, -0.006867408752441406, -0.005130290985107422, -0.0033931732177734375, -0.0016560554504394531, 8.106231689453125e-05, 0.0018181800842285156, 0.0035552978515625, 0.005292415618896484, 0.007029533386230469, 0.008766651153564453, 0.010503768920898438, 0.012240886688232422, 0.013978004455566406, 0.01571512222290039, 0.017452239990234375, 0.01918935775756836, 0.020926475524902344, 0.022663593292236328, 0.024400711059570312, 0.026137828826904297, 0.02787494659423828, 0.029612064361572266, 0.03134918212890625, 0.033086299896240234, 0.03482341766357422, 0.0365605354309082, 0.03829765319824219, 0.04003477096557617, 0.041771888732910156, 0.04350900650024414, 0.045246124267578125, 0.04698324203491211, 0.048720359802246094, 0.05045747756958008, 0.05219459533691406, 0.05393171310424805, 0.05566883087158203, 0.057405948638916016, 0.05914306640625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [15.0, 279.0, 681.0, 33.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12057021260261536, -0.06381553411483765, -0.0070608556270599365, 0.04969382286071777, 0.10644850134849548, 0.1632031798362732, 0.2199578583240509, 0.2767125368118286, 0.3334672152996063, 0.39022189378738403, 0.44697657227516174, 0.5037312507629395, 0.5604859590530396, 0.6172406077384949, 0.6739952564239502, 0.7307499647140503, 0.7875046730041504, 0.8442593812942505, 0.9010140299797058, 0.9577686786651611, 1.0145233869552612, 1.0712780952453613, 1.1280326843261719, 1.184787392616272, 1.241542100906372, 1.2982968091964722, 1.3550515174865723, 1.4118061065673828, 1.468560814857483, 1.525315523147583, 1.5820701122283936, 1.6388248205184937, 1.6955795288085938, 1.7523342370986938, 1.809088945388794, 1.8658435344696045, 1.9225982427597046, 1.9793529510498047, 2.0361075401306152, 2.092862367630005, 2.1496169567108154, 2.206371545791626, 2.2631263732910156, 2.319880962371826, 2.3766355514526367, 2.4333903789520264, 2.490144968032837, 2.5468997955322266, 2.603654384613037, 2.6604089736938477, 2.7171638011932373, 2.773918390274048, 2.8306732177734375, 2.887427806854248, 2.9441823959350586, 3.0009372234344482, 3.057691812515259, 3.1144464015960693, 3.171201229095459, 3.2279558181762695, 3.28471040725708, 3.3414652347564697, 3.3982198238372803, 3.45497465133667, 3.5117292404174805]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 13.0, 27.0, 22.0, 47.0, 58.0, 85.0, 92.0, 106.0, 82.0, 95.0, 93.0, 72.0, 44.0, 20.0, 20.0, 20.0, 14.0, 10.0, 5.0, 6.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.28923821449279785, -0.2812667489051819, -0.27329525351524353, -0.26532378792762756, -0.2573522925376892, -0.24938082695007324, -0.24140936136245728, -0.23343788087368011, -0.22546640038490295, -0.2174949198961258, -0.20952343940734863, -0.20155197381973267, -0.1935804933309555, -0.18560901284217834, -0.17763754725456238, -0.16966606676578522, -0.16169458627700806, -0.1537231057882309, -0.14575162529945374, -0.13778015971183777, -0.1298086792230606, -0.12183719873428345, -0.11386572569608688, -0.10589425265789032, -0.09792277216911316, -0.089951291680336, -0.08197981864213943, -0.07400834560394287, -0.06603686511516571, -0.05806538835167885, -0.050093911588191986, -0.042122434824705124, -0.03415095806121826, -0.0261794812977314, -0.018208004534244537, -0.010236527770757675, -0.002265051007270813, 0.005706425756216049, 0.013677902519702911, 0.021649379283189774, 0.029620856046676636, 0.0375923328101635, 0.04556380957365036, 0.05353528633713722, 0.061506763100624084, 0.06947824358940125, 0.07744971662759781, 0.08542118966579437, 0.09339267015457153, 0.1013641506433487, 0.10933562368154526, 0.11730709671974182, 0.12527857720851898, 0.13325005769729614, 0.1412215232849121, 0.14919300377368927, 0.15716448426246643, 0.1651359647512436, 0.17310744524002075, 0.18107891082763672, 0.18905039131641388, 0.19702187180519104, 0.204993337392807, 0.21296481788158417, 0.22093629837036133]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 7.0, 17.0, 18.0, 47.0, 79.0, 191.0, 376.0, 999.0, 2362.0, 6714.0, 21573.0, 125753.0, 753310.0, 107041.0, 19969.0, 6178.0, 2276.0, 901.0, 355.0, 176.0, 99.0, 35.0, 30.0, 14.0, 8.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.225341796875, -0.216827392578125, -0.20831298828125, -0.199798583984375, -0.1912841796875, -0.182769775390625, -0.17425537109375, -0.165740966796875, -0.1572265625, -0.148712158203125, -0.14019775390625, -0.131683349609375, -0.1231689453125, -0.114654541015625, -0.10614013671875, -0.097625732421875, -0.089111328125, -0.080596923828125, -0.07208251953125, -0.063568115234375, -0.0550537109375, -0.046539306640625, -0.03802490234375, -0.029510498046875, -0.02099609375, -0.012481689453125, -0.00396728515625, 0.004547119140625, 0.0130615234375, 0.021575927734375, 0.03009033203125, 0.038604736328125, 0.047119140625, 0.055633544921875, 0.06414794921875, 0.072662353515625, 0.0811767578125, 0.089691162109375, 0.09820556640625, 0.106719970703125, 0.115234375, 0.123748779296875, 0.13226318359375, 0.140777587890625, 0.1492919921875, 0.157806396484375, 0.16632080078125, 0.174835205078125, 0.183349609375, 0.191864013671875, 0.20037841796875, 0.208892822265625, 0.2174072265625, 0.225921630859375, 0.23443603515625, 0.242950439453125, 0.25146484375, 0.259979248046875, 0.26849365234375, 0.277008056640625, 0.2855224609375, 0.294036865234375, 0.30255126953125, 0.311065673828125, 0.319580078125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 11.0, 6.0, 5.0, 5.0, 6.0, 13.0, 8.0, 17.0, 26.0, 47.0, 57.0, 74.0, 90.0, 94.0, 106.0, 106.0, 64.0, 71.0, 44.0, 39.0, 25.0, 14.0, 15.0, 7.0, 6.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.016998291015625, -0.016397953033447266, -0.01579761505126953, -0.015197277069091797, -0.014596939086914062, -0.013996601104736328, -0.013396263122558594, -0.01279592514038086, -0.012195587158203125, -0.01159524917602539, -0.010994911193847656, -0.010394573211669922, -0.009794235229492188, -0.009193897247314453, -0.008593559265136719, -0.007993221282958984, -0.00739288330078125, -0.006792545318603516, -0.006192207336425781, -0.005591869354248047, -0.0049915313720703125, -0.004391193389892578, -0.0037908554077148438, -0.0031905174255371094, -0.002590179443359375, -0.0019898414611816406, -0.0013895034790039062, -0.0007891654968261719, -0.0001888275146484375, 0.0004115104675292969, 0.0010118484497070312, 0.0016121864318847656, 0.0022125244140625, 0.0028128623962402344, 0.0034132003784179688, 0.004013538360595703, 0.0046138763427734375, 0.005214214324951172, 0.005814552307128906, 0.006414890289306641, 0.007015228271484375, 0.007615566253662109, 0.008215904235839844, 0.008816242218017578, 0.009416580200195312, 0.010016918182373047, 0.010617256164550781, 0.011217594146728516, 0.01181793212890625, 0.012418270111083984, 0.013018608093261719, 0.013618946075439453, 0.014219284057617188, 0.014819622039794922, 0.015419960021972656, 0.01602029800415039, 0.016620635986328125, 0.01722097396850586, 0.017821311950683594, 0.018421649932861328, 0.019021987915039062, 0.019622325897216797, 0.02022266387939453, 0.020823001861572266, 0.02142333984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 6.0, 8.0, 10.0, 13.0, 22.0, 47.0, 143.0, 728.0, 7941.0, 646939.0, 386767.0, 5091.0, 556.0, 127.0, 28.0, 16.0, 9.0, 8.0, 8.0, 5.0, 4.0, 8.0, 9.0, 3.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.7470703125, -0.7278823852539062, -0.7086944580078125, -0.6895065307617188, -0.670318603515625, -0.6511306762695312, -0.6319427490234375, -0.6127548217773438, -0.59356689453125, -0.5743789672851562, -0.5551910400390625, -0.5360031127929688, -0.516815185546875, -0.49762725830078125, -0.4784393310546875, -0.45925140380859375, -0.4400634765625, -0.42087554931640625, -0.4016876220703125, -0.38249969482421875, -0.363311767578125, -0.34412384033203125, -0.3249359130859375, -0.30574798583984375, -0.28656005859375, -0.26737213134765625, -0.2481842041015625, -0.22899627685546875, -0.209808349609375, -0.19062042236328125, -0.1714324951171875, -0.15224456787109375, -0.133056640625, -0.11386871337890625, -0.0946807861328125, -0.07549285888671875, -0.056304931640625, -0.03711700439453125, -0.0179290771484375, 0.00125885009765625, 0.02044677734375, 0.03963470458984375, 0.0588226318359375, 0.07801055908203125, 0.097198486328125, 0.11638641357421875, 0.1355743408203125, 0.15476226806640625, 0.1739501953125, 0.19313812255859375, 0.2123260498046875, 0.23151397705078125, 0.250701904296875, 0.26988983154296875, 0.2890777587890625, 0.30826568603515625, 0.32745361328125, 0.34664154052734375, 0.3658294677734375, 0.38501739501953125, 0.404205322265625, 0.42339324951171875, 0.4425811767578125, 0.46176910400390625, 0.48095703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 9.0, 2.0, 5.0, 4.0, 6.0, 8.0, 9.0, 13.0, 13.0, 7.0, 13.0, 19.0, 24.0, 22.0, 22.0, 23.0, 35.0, 38.0, 38.0, 33.0, 36.0, 47.0, 53.0, 34.0, 45.0, 34.0, 45.0, 44.0, 31.0, 36.0, 30.0, 31.0, 29.0, 34.0, 23.0, 17.0, 20.0, 18.0, 9.0, 11.0, 9.0, 7.0, 2.0, 4.0, 3.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0850830078125, -0.0824737548828125, -0.079864501953125, -0.0772552490234375, -0.07464599609375, -0.0720367431640625, -0.069427490234375, -0.0668182373046875, -0.064208984375, -0.0615997314453125, -0.058990478515625, -0.0563812255859375, -0.05377197265625, -0.0511627197265625, -0.048553466796875, -0.0459442138671875, -0.0433349609375, -0.0407257080078125, -0.038116455078125, -0.0355072021484375, -0.03289794921875, -0.0302886962890625, -0.027679443359375, -0.0250701904296875, -0.0224609375, -0.0198516845703125, -0.017242431640625, -0.0146331787109375, -0.01202392578125, -0.0094146728515625, -0.006805419921875, -0.0041961669921875, -0.0015869140625, 0.0010223388671875, 0.003631591796875, 0.0062408447265625, 0.00885009765625, 0.0114593505859375, 0.014068603515625, 0.0166778564453125, 0.019287109375, 0.0218963623046875, 0.024505615234375, 0.0271148681640625, 0.02972412109375, 0.0323333740234375, 0.034942626953125, 0.0375518798828125, 0.0401611328125, 0.0427703857421875, 0.045379638671875, 0.0479888916015625, 0.05059814453125, 0.0532073974609375, 0.055816650390625, 0.0584259033203125, 0.06103515625, 0.0636444091796875, 0.066253662109375, 0.0688629150390625, 0.07147216796875, 0.0740814208984375, 0.076690673828125, 0.0792999267578125, 0.0819091796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 9.0, 8.0, 7.0, 22.0, 29.0, 56.0, 127.0, 468.0, 3414.0, 825038.0, 216589.0, 2222.0, 328.0, 91.0, 40.0, 31.0, 30.0, 6.0, 10.0, 2.0, 4.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0126953125, -0.9828338623046875, -0.952972412109375, -0.9231109619140625, -0.89324951171875, -0.8633880615234375, -0.833526611328125, -0.8036651611328125, -0.7738037109375, -0.7439422607421875, -0.714080810546875, -0.6842193603515625, -0.65435791015625, -0.6244964599609375, -0.594635009765625, -0.5647735595703125, -0.534912109375, -0.5050506591796875, -0.475189208984375, -0.4453277587890625, -0.41546630859375, -0.3856048583984375, -0.355743408203125, -0.3258819580078125, -0.2960205078125, -0.2661590576171875, -0.236297607421875, -0.2064361572265625, -0.17657470703125, -0.1467132568359375, -0.116851806640625, -0.0869903564453125, -0.05712890625, -0.0272674560546875, 0.002593994140625, 0.0324554443359375, 0.06231689453125, 0.0921783447265625, 0.122039794921875, 0.1519012451171875, 0.1817626953125, 0.2116241455078125, 0.241485595703125, 0.2713470458984375, 0.30120849609375, 0.3310699462890625, 0.360931396484375, 0.3907928466796875, 0.420654296875, 0.4505157470703125, 0.480377197265625, 0.5102386474609375, 0.54010009765625, 0.5699615478515625, 0.599822998046875, 0.6296844482421875, 0.6595458984375, 0.6894073486328125, 0.719268798828125, 0.7491302490234375, 0.77899169921875, 0.8088531494140625, 0.838714599609375, 0.8685760498046875, 0.8984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 2.0, 3.0, 5.0, 5.0, 10.0, 16.0, 9.0, 27.0, 31.0, 61.0, 181.0, 323.0, 138.0, 58.0, 30.0, 20.0, 20.0, 9.0, 6.0, 11.0, 8.0, 4.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010747909545898438, -0.0010394752025604248, -0.0010041594505310059, -0.0009688436985015869, -0.000933527946472168, -0.000898212194442749, -0.0008628964424133301, -0.0008275806903839111, -0.0007922649383544922, -0.0007569491863250732, -0.0007216334342956543, -0.0006863176822662354, -0.0006510019302368164, -0.0006156861782073975, -0.0005803704261779785, -0.0005450546741485596, -0.0005097389221191406, -0.0004744231700897217, -0.00043910741806030273, -0.0004037916660308838, -0.00036847591400146484, -0.0003331601619720459, -0.00029784440994262695, -0.000262528657913208, -0.00022721290588378906, -0.00019189715385437012, -0.00015658140182495117, -0.00012126564979553223, -8.594989776611328e-05, -5.0634145736694336e-05, -1.531839370727539e-05, 1.9997358322143555e-05, 5.53131103515625e-05, 9.062886238098145e-05, 0.0001259446144104004, 0.00016126036643981934, 0.00019657611846923828, 0.00023189187049865723, 0.00026720762252807617, 0.0003025233745574951, 0.00033783912658691406, 0.000373154878616333, 0.00040847063064575195, 0.0004437863826751709, 0.00047910213470458984, 0.0005144178867340088, 0.0005497336387634277, 0.0005850493907928467, 0.0006203651428222656, 0.0006556808948516846, 0.0006909966468811035, 0.0007263123989105225, 0.0007616281509399414, 0.0007969439029693604, 0.0008322596549987793, 0.0008675754070281982, 0.0009028911590576172, 0.0009382069110870361, 0.0009735226631164551, 0.001008838415145874, 0.001044154167175293, 0.001079469919204712, 0.0011147856712341309, 0.0011501014232635498, 0.0011854171752929688]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 12.0, 18.0, 39.0, 86.0, 225.0, 573.0, 2195.0, 12693.0, 437269.0, 576920.0, 15092.0, 2360.0, 660.0, 220.0, 84.0, 42.0, 20.0, 16.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.619140625, -0.6036758422851562, -0.5882110595703125, -0.5727462768554688, -0.557281494140625, -0.5418167114257812, -0.5263519287109375, -0.5108871459960938, -0.49542236328125, -0.47995758056640625, -0.4644927978515625, -0.44902801513671875, -0.433563232421875, -0.41809844970703125, -0.4026336669921875, -0.38716888427734375, -0.3717041015625, -0.35623931884765625, -0.3407745361328125, -0.32530975341796875, -0.309844970703125, -0.29438018798828125, -0.2789154052734375, -0.26345062255859375, -0.24798583984375, -0.23252105712890625, -0.2170562744140625, -0.20159149169921875, -0.186126708984375, -0.17066192626953125, -0.1551971435546875, -0.13973236083984375, -0.124267578125, -0.10880279541015625, -0.0933380126953125, -0.07787322998046875, -0.062408447265625, -0.04694366455078125, -0.0314788818359375, -0.01601409912109375, -0.00054931640625, 0.01491546630859375, 0.0303802490234375, 0.04584503173828125, 0.061309814453125, 0.07677459716796875, 0.0922393798828125, 0.10770416259765625, 0.1231689453125, 0.13863372802734375, 0.1540985107421875, 0.16956329345703125, 0.185028076171875, 0.20049285888671875, 0.2159576416015625, 0.23142242431640625, 0.24688720703125, 0.26235198974609375, 0.2778167724609375, 0.29328155517578125, 0.308746337890625, 0.32421112060546875, 0.3396759033203125, 0.35514068603515625, 0.37060546875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 11.0, 18.0, 19.0, 18.0, 29.0, 44.0, 50.0, 73.0, 72.0, 91.0, 85.0, 84.0, 82.0, 66.0, 42.0, 34.0, 36.0, 34.0, 15.0, 12.0, 13.0, 16.0, 4.0, 7.0, 5.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.1033935546875, -0.09981727600097656, -0.09624099731445312, -0.09266471862792969, -0.08908843994140625, -0.08551216125488281, -0.08193588256835938, -0.07835960388183594, -0.0747833251953125, -0.07120704650878906, -0.06763076782226562, -0.06405448913574219, -0.06047821044921875, -0.05690193176269531, -0.053325653076171875, -0.04974937438964844, -0.046173095703125, -0.04259681701660156, -0.039020538330078125, -0.03544425964355469, -0.03186798095703125, -0.028291702270507812, -0.024715423583984375, -0.021139144897460938, -0.0175628662109375, -0.013986587524414062, -0.010410308837890625, -0.0068340301513671875, -0.00325775146484375, 0.0003185272216796875, 0.003894805908203125, 0.0074710845947265625, 0.01104736328125, 0.014623641967773438, 0.018199920654296875, 0.021776199340820312, 0.02535247802734375, 0.028928756713867188, 0.032505035400390625, 0.03608131408691406, 0.0396575927734375, 0.04323387145996094, 0.046810150146484375, 0.05038642883300781, 0.05396270751953125, 0.05753898620605469, 0.061115264892578125, 0.06469154357910156, 0.068267822265625, 0.07184410095214844, 0.07542037963867188, 0.07899665832519531, 0.08257293701171875, 0.08614921569824219, 0.08972549438476562, 0.09330177307128906, 0.0968780517578125, 0.10045433044433594, 0.10403060913085938, 0.10760688781738281, 0.11118316650390625, 0.11475944519042969, 0.11833572387695312, 0.12191200256347656, 0.12548828125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 17.0, 39.0, 87.0, 261.0, 335.0, 163.0, 51.0, 19.0, 9.0, 8.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462106823921204, -0.887650728225708, -0.8290907740592957, -0.7705308198928833, -0.7119709253311157, -0.6534109115600586, -0.594851016998291, -0.5362910628318787, -0.4777311086654663, -0.41917115449905396, -0.3606112003326416, -0.30205127596855164, -0.24349132180213928, -0.18493136763572693, -0.12637144327163696, -0.06781148910522461, -0.009251534938812256, 0.0493084117770195, 0.10786835849285126, 0.16642829775810242, 0.22498825192451477, 0.2835482060909271, 0.3421081304550171, 0.40066808462142944, 0.4592280387878418, 0.5177879929542542, 0.5763479471206665, 0.6349078416824341, 0.6934678554534912, 0.7520277500152588, 0.8105877041816711, 0.8691476583480835, 0.9277076721191406, 0.986267626285553, 1.0448275804519653, 1.103387475013733, 1.16194748878479, 1.2205073833465576, 1.2790672779083252, 1.3376272916793823, 1.3961873054504395, 1.454747200012207, 1.5133072137832642, 1.5718671083450317, 1.6304271221160889, 1.6889870166778564, 1.747546911239624, 1.8061069250106812, 1.8646668195724487, 1.9232267141342163, 1.9817867279052734, 2.040346622467041, 2.0989065170288086, 2.1574666500091553, 2.216026544570923, 2.2745864391326904, 2.333146333694458, 2.3917062282562256, 2.450266122817993, 2.50882625579834, 2.5673861503601074, 2.625946044921875, 2.6845059394836426, 2.74306583404541, 2.801625967025757]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 12.0, 14.0, 21.0, 28.0, 32.0, 63.0, 86.0, 87.0, 110.0, 140.0, 124.0, 85.0, 59.0, 45.0, 23.0, 20.0, 9.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1661746501922607, -1.1209747791290283, -1.0757747888565063, -1.030574917793274, -0.9853750467300415, -0.9401751160621643, -0.8949751853942871, -0.8497753143310547, -0.8045753836631775, -0.7593754529953003, -0.7141755819320679, -0.6689756512641907, -0.6237757205963135, -0.578575849533081, -0.5333759188652039, -0.48817601799964905, -0.44297611713409424, -0.39777621626853943, -0.3525763154029846, -0.3073763847351074, -0.2621764838695526, -0.2169765830039978, -0.1717766523361206, -0.1265767514705658, -0.08137685060501099, -0.03617694228887558, 0.009022966027259827, 0.05422288179397583, 0.09942278265953064, 0.14462268352508545, 0.18982261419296265, 0.23502251505851746, 0.2802225351333618, 0.3254224359989166, 0.37062233686447144, 0.41582226753234863, 0.46102216839790344, 0.5062220692634583, 0.5514219999313354, 0.5966218709945679, 0.6418218016624451, 0.6870217323303223, 0.7322216033935547, 0.7774215340614319, 0.8226214647293091, 0.8678213357925415, 0.9130212664604187, 0.9582211971282959, 1.0034210681915283, 1.0486209392547607, 1.0938209295272827, 1.1390208005905151, 1.1842206716537476, 1.2294206619262695, 1.274620532989502, 1.3198204040527344, 1.3650202751159668, 1.4102201461791992, 1.4554201364517212, 1.5006200075149536, 1.545819878578186, 1.591019868850708, 1.6362197399139404, 1.6814196109771729, 1.7266196012496948]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 8.0, 8.0, 8.0, 4.0, 8.0, 12.0, 0.0, 7.0, 13.0, 14.0, 10.0, 28.0, 51.0, 124.0, 287.0, 962.0, 4988.0, 123970.0, 4044390.0, 16579.0, 1914.0, 510.0, 154.0, 63.0, 50.0, 37.0, 28.0, 7.0, 5.0, 9.0, 1.0, 1.0, 4.0, 5.0, 13.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.2109375, -1.1765670776367188, -1.1421966552734375, -1.1078262329101562, -1.073455810546875, -1.0390853881835938, -1.0047149658203125, -0.9703445434570312, -0.93597412109375, -0.9016036987304688, -0.8672332763671875, -0.8328628540039062, -0.798492431640625, -0.7641220092773438, -0.7297515869140625, -0.6953811645507812, -0.6610107421875, -0.6266403198242188, -0.5922698974609375, -0.5578994750976562, -0.523529052734375, -0.48915863037109375, -0.4547882080078125, -0.42041778564453125, -0.38604736328125, -0.35167694091796875, -0.3173065185546875, -0.28293609619140625, -0.248565673828125, -0.21419525146484375, -0.1798248291015625, -0.14545440673828125, -0.111083984375, -0.07671356201171875, -0.0423431396484375, -0.00797271728515625, 0.026397705078125, 0.06076812744140625, 0.0951385498046875, 0.12950897216796875, 0.16387939453125, 0.19824981689453125, 0.2326202392578125, 0.26699066162109375, 0.301361083984375, 0.33573150634765625, 0.3701019287109375, 0.40447235107421875, 0.4388427734375, 0.47321319580078125, 0.5075836181640625, 0.5419540405273438, 0.576324462890625, 0.6106948852539062, 0.6450653076171875, 0.6794357299804688, 0.71380615234375, 0.7481765747070312, 0.7825469970703125, 0.8169174194335938, 0.851287841796875, 0.8856582641601562, 0.9200286865234375, 0.9543991088867188, 0.98876953125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 11.0, 10.0, 14.0, 23.0, 33.0, 48.0, 55.0, 61.0, 76.0, 85.0, 84.0, 94.0, 79.0, 75.0, 44.0, 51.0, 45.0, 34.0, 18.0, 6.0, 7.0, 4.0, 7.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0194091796875, -0.01886439323425293, -0.01831960678100586, -0.01777482032775879, -0.01723003387451172, -0.01668524742126465, -0.016140460968017578, -0.015595674514770508, -0.015050888061523438, -0.014506101608276367, -0.013961315155029297, -0.013416528701782227, -0.012871742248535156, -0.012326955795288086, -0.011782169342041016, -0.011237382888793945, -0.010692596435546875, -0.010147809982299805, -0.009603023529052734, -0.009058237075805664, -0.008513450622558594, -0.007968664169311523, -0.007423877716064453, -0.006879091262817383, -0.0063343048095703125, -0.005789518356323242, -0.005244731903076172, -0.0046999454498291016, -0.004155158996582031, -0.003610372543334961, -0.0030655860900878906, -0.0025207996368408203, -0.00197601318359375, -0.0014312267303466797, -0.0008864402770996094, -0.00034165382385253906, 0.00020313262939453125, 0.0007479190826416016, 0.0012927055358886719, 0.0018374919891357422, 0.0023822784423828125, 0.002927064895629883, 0.003471851348876953, 0.0040166378021240234, 0.004561424255371094, 0.005106210708618164, 0.005650997161865234, 0.006195783615112305, 0.006740570068359375, 0.007285356521606445, 0.007830142974853516, 0.008374929428100586, 0.008919715881347656, 0.009464502334594727, 0.010009288787841797, 0.010554075241088867, 0.011098861694335938, 0.011643648147583008, 0.012188434600830078, 0.012733221054077148, 0.013278007507324219, 0.013822793960571289, 0.01436758041381836, 0.01491236686706543, 0.0154571533203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 12.0, 49.0, 125.0, 575.0, 8043.0, 4137203.0, 46768.0, 1203.0, 198.0, 71.0, 23.0, 7.0, 10.0, 1.0, 1.0], "bins": [-2.3828125, -2.3392333984375, -2.295654296875, -2.2520751953125, -2.20849609375, -2.1649169921875, -2.121337890625, -2.0777587890625, -2.0341796875, -1.9906005859375, -1.947021484375, -1.9034423828125, -1.85986328125, -1.8162841796875, -1.772705078125, -1.7291259765625, -1.685546875, -1.6419677734375, -1.598388671875, -1.5548095703125, -1.51123046875, -1.4676513671875, -1.424072265625, -1.3804931640625, -1.3369140625, -1.2933349609375, -1.249755859375, -1.2061767578125, -1.16259765625, -1.1190185546875, -1.075439453125, -1.0318603515625, -0.98828125, -0.9447021484375, -0.901123046875, -0.8575439453125, -0.81396484375, -0.7703857421875, -0.726806640625, -0.6832275390625, -0.6396484375, -0.5960693359375, -0.552490234375, -0.5089111328125, -0.46533203125, -0.4217529296875, -0.378173828125, -0.3345947265625, -0.291015625, -0.2474365234375, -0.203857421875, -0.1602783203125, -0.11669921875, -0.0731201171875, -0.029541015625, 0.0140380859375, 0.0576171875, 0.1011962890625, 0.144775390625, 0.1883544921875, 0.23193359375, 0.2755126953125, 0.319091796875, 0.3626708984375, 0.40625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 13.0, 13.0, 13.0, 25.0, 24.0, 44.0, 51.0, 97.0, 153.0, 284.0, 777.0, 1516.0, 498.0, 195.0, 118.0, 63.0, 62.0, 34.0, 24.0, 10.0, 9.0, 8.0, 4.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.043365478515625, -0.04202413558959961, -0.04068279266357422, -0.03934144973754883, -0.03800010681152344, -0.03665876388549805, -0.035317420959472656, -0.033976078033447266, -0.032634735107421875, -0.031293392181396484, -0.029952049255371094, -0.028610706329345703, -0.027269363403320312, -0.025928020477294922, -0.02458667755126953, -0.02324533462524414, -0.02190399169921875, -0.02056264877319336, -0.01922130584716797, -0.017879962921142578, -0.016538619995117188, -0.015197277069091797, -0.013855934143066406, -0.012514591217041016, -0.011173248291015625, -0.009831905364990234, -0.008490562438964844, -0.007149219512939453, -0.0058078765869140625, -0.004466533660888672, -0.0031251907348632812, -0.0017838478088378906, -0.0004425048828125, 0.0008988380432128906, 0.0022401809692382812, 0.003581523895263672, 0.0049228668212890625, 0.006264209747314453, 0.007605552673339844, 0.008946895599365234, 0.010288238525390625, 0.011629581451416016, 0.012970924377441406, 0.014312267303466797, 0.015653610229492188, 0.016994953155517578, 0.01833629608154297, 0.01967763900756836, 0.02101898193359375, 0.02236032485961914, 0.02370166778564453, 0.025043010711669922, 0.026384353637695312, 0.027725696563720703, 0.029067039489746094, 0.030408382415771484, 0.031749725341796875, 0.033091068267822266, 0.034432411193847656, 0.03577375411987305, 0.03711509704589844, 0.03845643997192383, 0.03979778289794922, 0.04113912582397461, 0.04248046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 42.0, 804.0, 153.0, 13.0, 1.0], "bins": [-5.712839603424072, -5.6185622215271, -5.524285316467285, -5.4300079345703125, -5.33573055267334, -5.241453170776367, -5.147176265716553, -5.05289888381958, -4.958621501922607, -4.864344120025635, -4.77006721496582, -4.675789833068848, -4.581512451171875, -4.487235069274902, -4.392958164215088, -4.298680782318115, -4.204403400421143, -4.11012601852417, -4.0158491134643555, -3.921571731567383, -3.82729434967041, -3.7330172061920166, -3.638739824295044, -3.5444626808166504, -3.450185537338257, -3.3559083938598633, -3.2616310119628906, -3.167353868484497, -3.0730764865875244, -2.978799343109131, -2.884521961212158, -2.7902448177337646, -2.695967435836792, -2.6016902923583984, -2.507412910461426, -2.4131357669830322, -2.3188583850860596, -2.224581241607666, -2.1303038597106934, -2.0360267162323, -1.9417493343353271, -1.847472071647644, -1.753194808959961, -1.6589175462722778, -1.5646402835845947, -1.4703630208969116, -1.3760857582092285, -1.281808614730835, -1.1875313520431519, -1.0932540893554688, -0.9989768266677856, -0.9046995639801025, -0.8104223012924194, -0.7161450386047363, -0.621867835521698, -0.5275905728340149, -0.4333133101463318, -0.3390360474586487, -0.24475879967212677, -0.15048155188560486, -0.05620428919792175, 0.03807297348976135, 0.13235020637512207, 0.22662746906280518, 0.3209047317504883]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 13.0, 9.0, 32.0, 67.0, 76.0, 103.0, 157.0, 165.0, 148.0, 97.0, 69.0, 30.0, 20.0, 13.0, 7.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.9175159335136414, -0.8995136618614197, -0.881511390209198, -0.8635091185569763, -0.8455069065093994, -0.8275046348571777, -0.809502363204956, -0.7915000915527344, -0.7734978199005127, -0.755495548248291, -0.7374932765960693, -0.7194910049438477, -0.701488733291626, -0.6834865212440491, -0.6654842495918274, -0.6474819779396057, -0.629479706287384, -0.6114774346351624, -0.5934751629829407, -0.575472891330719, -0.5574706792831421, -0.5394684076309204, -0.5214661359786987, -0.503463864326477, -0.48546159267425537, -0.4674593210220337, -0.449457049369812, -0.4314548075199127, -0.41345253586769104, -0.39545026421546936, -0.37744802236557007, -0.3594457507133484, -0.3414434790611267, -0.32344120740890503, -0.30543893575668335, -0.28743669390678406, -0.2694344222545624, -0.2514321506023407, -0.2334298938512802, -0.21542763710021973, -0.19742536544799805, -0.17942309379577637, -0.16142083704471588, -0.1434185802936554, -0.12541630864143372, -0.10741404443979263, -0.08941178023815155, -0.07140952348709106, -0.053407251834869385, -0.0354049876332283, -0.01740272343158722, 0.0005995407700538635, 0.018601804971694946, 0.03660406917333603, 0.05460633337497711, 0.0726085901260376, 0.09061086177825928, 0.10861312597990036, 0.12661539018154144, 0.14461764693260193, 0.1626199185848236, 0.1806221902370453, 0.19862444698810577, 0.21662670373916626, 0.23462897539138794]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 7.0, 4.0, 11.0, 4.0, 7.0, 12.0, 21.0, 16.0, 32.0, 32.0, 25.0, 27.0, 34.0, 41.0, 65.0, 52.0, 838.0, 1045748.0, 1137.0, 61.0, 57.0, 50.0, 45.0, 32.0, 39.0, 27.0, 34.0, 11.0, 26.0, 9.0, 8.0, 11.0, 7.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.8005828857421875, -1.727142333984375, -1.6537017822265625, -1.58026123046875, -1.5068206787109375, -1.433380126953125, -1.3599395751953125, -1.2864990234375, -1.2130584716796875, -1.139617919921875, -1.0661773681640625, -0.99273681640625, -0.9192962646484375, -0.845855712890625, -0.7724151611328125, -0.698974609375, -0.6255340576171875, -0.552093505859375, -0.4786529541015625, -0.40521240234375, -0.3317718505859375, -0.258331298828125, -0.1848907470703125, -0.1114501953125, -0.0380096435546875, 0.035430908203125, 0.1088714599609375, 0.18231201171875, 0.2557525634765625, 0.329193115234375, 0.4026336669921875, 0.47607421875, 0.5495147705078125, 0.622955322265625, 0.6963958740234375, 0.76983642578125, 0.8432769775390625, 0.916717529296875, 0.9901580810546875, 1.0635986328125, 1.1370391845703125, 1.210479736328125, 1.2839202880859375, 1.35736083984375, 1.4308013916015625, 1.504241943359375, 1.5776824951171875, 1.651123046875, 1.7245635986328125, 1.798004150390625, 1.8714447021484375, 1.94488525390625, 2.0183258056640625, 2.091766357421875, 2.1652069091796875, 2.2386474609375, 2.3120880126953125, 2.385528564453125, 2.4589691162109375, 2.53240966796875, 2.6058502197265625, 2.679290771484375, 2.7527313232421875, 2.826171875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 34.0, 191.0, 440.0, 277.0, 58.0, 13.0, 1.0], "bins": [-0.2120361328125, -0.20847773551940918, -0.20491933822631836, -0.20136094093322754, -0.19780254364013672, -0.1942441463470459, -0.19068574905395508, -0.18712735176086426, -0.18356895446777344, -0.18001055717468262, -0.1764521598815918, -0.17289376258850098, -0.16933536529541016, -0.16577696800231934, -0.16221857070922852, -0.1586601734161377, -0.15510177612304688, -0.15154337882995605, -0.14798498153686523, -0.14442658424377441, -0.1408681869506836, -0.13730978965759277, -0.13375139236450195, -0.13019299507141113, -0.1266345977783203, -0.12307620048522949, -0.11951780319213867, -0.11595940589904785, -0.11240100860595703, -0.10884261131286621, -0.10528421401977539, -0.10172581672668457, -0.09816741943359375, -0.09460902214050293, -0.09105062484741211, -0.08749222755432129, -0.08393383026123047, -0.08037543296813965, -0.07681703567504883, -0.07325863838195801, -0.06970024108886719, -0.06614184379577637, -0.06258344650268555, -0.05902504920959473, -0.055466651916503906, -0.051908254623413086, -0.048349857330322266, -0.044791460037231445, -0.041233062744140625, -0.037674665451049805, -0.034116268157958984, -0.030557870864868164, -0.026999473571777344, -0.023441076278686523, -0.019882678985595703, -0.016324281692504883, -0.012765884399414062, -0.009207487106323242, -0.005649089813232422, -0.0020906925201416016, 0.0014677047729492188, 0.005026102066040039, 0.00858449935913086, 0.01214289665222168, 0.0157012939453125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 20.0, 20.0, 25.0, 32.0, 43.0, 72.0, 93.0, 123.0, 209.0, 359.0, 648.0, 1131.0, 2263.0, 4743.0, 11802.0, 36218.0, 164355.0, 560586.0, 199781.0, 42227.0, 13404.0, 5109.0, 2314.0, 1134.0, 679.0, 402.0, 234.0, 168.0, 118.0, 76.0, 37.0, 29.0, 22.0, 14.0, 14.0, 10.0, 8.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.41162109375, -0.39935302734375, -0.3870849609375, -0.37481689453125, -0.362548828125, -0.35028076171875, -0.3380126953125, -0.32574462890625, -0.3134765625, -0.30120849609375, -0.2889404296875, -0.27667236328125, -0.264404296875, -0.25213623046875, -0.2398681640625, -0.22760009765625, -0.21533203125, -0.20306396484375, -0.1907958984375, -0.17852783203125, -0.166259765625, -0.15399169921875, -0.1417236328125, -0.12945556640625, -0.1171875, -0.10491943359375, -0.0926513671875, -0.08038330078125, -0.068115234375, -0.05584716796875, -0.0435791015625, -0.03131103515625, -0.01904296875, -0.00677490234375, 0.0054931640625, 0.01776123046875, 0.030029296875, 0.04229736328125, 0.0545654296875, 0.06683349609375, 0.0791015625, 0.09136962890625, 0.1036376953125, 0.11590576171875, 0.128173828125, 0.14044189453125, 0.1527099609375, 0.16497802734375, 0.17724609375, 0.18951416015625, 0.2017822265625, 0.21405029296875, 0.226318359375, 0.23858642578125, 0.2508544921875, 0.26312255859375, 0.275390625, 0.28765869140625, 0.2999267578125, 0.31219482421875, 0.324462890625, 0.33673095703125, 0.3489990234375, 0.36126708984375, 0.37353515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 13.0, 13.0, 20.0, 21.0, 27.0, 38.0, 39.0, 49.0, 48.0, 74.0, 56.0, 71.0, 62.0, 75.0, 65.0, 57.0, 48.0, 42.0, 39.0, 37.0, 21.0, 15.0, 10.0, 12.0, 7.0, 11.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1796875, -0.1738605499267578, -0.16803359985351562, -0.16220664978027344, -0.15637969970703125, -0.15055274963378906, -0.14472579956054688, -0.1388988494873047, -0.1330718994140625, -0.1272449493408203, -0.12141799926757812, -0.11559104919433594, -0.10976409912109375, -0.10393714904785156, -0.09811019897460938, -0.09228324890136719, -0.086456298828125, -0.08062934875488281, -0.07480239868164062, -0.06897544860839844, -0.06314849853515625, -0.05732154846191406, -0.051494598388671875, -0.04566764831542969, -0.0398406982421875, -0.03401374816894531, -0.028186798095703125, -0.022359848022460938, -0.01653289794921875, -0.010705947875976562, -0.004878997802734375, 0.0009479522705078125, 0.00677490234375, 0.012601852416992188, 0.018428802490234375, 0.024255752563476562, 0.03008270263671875, 0.03590965270996094, 0.041736602783203125, 0.04756355285644531, 0.0533905029296875, 0.05921745300292969, 0.06504440307617188, 0.07087135314941406, 0.07669830322265625, 0.08252525329589844, 0.08835220336914062, 0.09417915344238281, 0.100006103515625, 0.10583305358886719, 0.11166000366210938, 0.11748695373535156, 0.12331390380859375, 0.12914085388183594, 0.13496780395507812, 0.1407947540283203, 0.1466217041015625, 0.1524486541748047, 0.15827560424804688, 0.16410255432128906, 0.16992950439453125, 0.17575645446777344, 0.18158340454101562, 0.1874103546142578, 0.1932373046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 6.0, 1.0, 8.0, 9.0, 6.0, 7.0, 13.0, 16.0, 29.0, 35.0, 44.0, 65.0, 98.0, 137.0, 278.0, 446.0, 1080.0, 2888.0, 9695.0, 45474.0, 309479.0, 556002.0, 97495.0, 17523.0, 4579.0, 1590.0, 672.0, 314.0, 187.0, 117.0, 70.0, 44.0, 32.0, 29.0, 18.0, 22.0, 8.0, 13.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3838310241699219, -0.37068939208984375, -0.3575477600097656, -0.3444061279296875, -0.3312644958496094, -0.31812286376953125, -0.3049812316894531, -0.291839599609375, -0.2786979675292969, -0.26555633544921875, -0.2524147033691406, -0.2392730712890625, -0.22613143920898438, -0.21298980712890625, -0.19984817504882812, -0.18670654296875, -0.17356491088867188, -0.16042327880859375, -0.14728164672851562, -0.1341400146484375, -0.12099838256835938, -0.10785675048828125, -0.09471511840820312, -0.081573486328125, -0.06843185424804688, -0.05529022216796875, -0.042148590087890625, -0.0290069580078125, -0.015865325927734375, -0.00272369384765625, 0.010417938232421875, 0.0235595703125, 0.036701202392578125, 0.04984283447265625, 0.06298446655273438, 0.0761260986328125, 0.08926773071289062, 0.10240936279296875, 0.11555099487304688, 0.128692626953125, 0.14183425903320312, 0.15497589111328125, 0.16811752319335938, 0.1812591552734375, 0.19440078735351562, 0.20754241943359375, 0.22068405151367188, 0.23382568359375, 0.24696731567382812, 0.26010894775390625, 0.2732505798339844, 0.2863922119140625, 0.2995338439941406, 0.31267547607421875, 0.3258171081542969, 0.338958740234375, 0.3521003723144531, 0.36524200439453125, 0.3783836364746094, 0.3915252685546875, 0.4046669006347656, 0.41780853271484375, 0.4309501647949219, 0.444091796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 7.0, 9.0, 6.0, 12.0, 11.0, 10.0, 20.0, 29.0, 21.0, 30.0, 35.0, 38.0, 60.0, 74.0, 85.0, 92.0, 68.0, 76.0, 65.0, 45.0, 33.0, 26.0, 24.0, 26.0, 22.0, 13.0, 11.0, 7.0, 6.0, 11.0, 3.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00013589859008789062, -0.00013161450624465942, -0.00012733042240142822, -0.00012304633855819702, -0.00011876225471496582, -0.00011447817087173462, -0.00011019408702850342, -0.00010591000318527222, -0.00010162591934204102, -9.734183549880981e-05, -9.305775165557861e-05, -8.877366781234741e-05, -8.448958396911621e-05, -8.020550012588501e-05, -7.592141628265381e-05, -7.163733243942261e-05, -6.73532485961914e-05, -6.30691647529602e-05, -5.8785080909729004e-05, -5.45009970664978e-05, -5.02169132232666e-05, -4.59328293800354e-05, -4.16487455368042e-05, -3.7364661693573e-05, -3.30805778503418e-05, -2.8796494007110596e-05, -2.4512410163879395e-05, -2.0228326320648193e-05, -1.5944242477416992e-05, -1.1660158634185791e-05, -7.37607479095459e-06, -3.0919909477233887e-06, 1.1920928955078125e-06, 5.476176738739014e-06, 9.760260581970215e-06, 1.4044344425201416e-05, 1.8328428268432617e-05, 2.261251211166382e-05, 2.689659595489502e-05, 3.118067979812622e-05, 3.546476364135742e-05, 3.974884748458862e-05, 4.4032931327819824e-05, 4.8317015171051025e-05, 5.2601099014282227e-05, 5.688518285751343e-05, 6.116926670074463e-05, 6.545335054397583e-05, 6.973743438720703e-05, 7.402151823043823e-05, 7.830560207366943e-05, 8.258968591690063e-05, 8.687376976013184e-05, 9.115785360336304e-05, 9.544193744659424e-05, 9.972602128982544e-05, 0.00010401010513305664, 0.00010829418897628784, 0.00011257827281951904, 0.00011686235666275024, 0.00012114644050598145, 0.00012543052434921265, 0.00012971460819244385, 0.00013399869203567505, 0.00013828277587890625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 17.0, 7.0, 14.0, 31.0, 58.0, 71.0, 142.0, 253.0, 449.0, 1072.0, 3330.0, 15729.0, 136055.0, 755469.0, 117040.0, 13837.0, 2961.0, 1024.0, 461.0, 214.0, 121.0, 69.0, 42.0, 25.0, 23.0, 15.0, 6.0, 3.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40771484375, -0.3895721435546875, -0.371429443359375, -0.3532867431640625, -0.33514404296875, -0.3170013427734375, -0.298858642578125, -0.2807159423828125, -0.2625732421875, -0.2444305419921875, -0.226287841796875, -0.2081451416015625, -0.19000244140625, -0.1718597412109375, -0.153717041015625, -0.1355743408203125, -0.117431640625, -0.0992889404296875, -0.081146240234375, -0.0630035400390625, -0.04486083984375, -0.0267181396484375, -0.008575439453125, 0.0095672607421875, 0.0277099609375, 0.0458526611328125, 0.063995361328125, 0.0821380615234375, 0.10028076171875, 0.1184234619140625, 0.136566162109375, 0.1547088623046875, 0.1728515625, 0.1909942626953125, 0.209136962890625, 0.2272796630859375, 0.24542236328125, 0.2635650634765625, 0.281707763671875, 0.2998504638671875, 0.3179931640625, 0.3361358642578125, 0.354278564453125, 0.3724212646484375, 0.39056396484375, 0.4087066650390625, 0.426849365234375, 0.4449920654296875, 0.463134765625, 0.4812774658203125, 0.499420166015625, 0.5175628662109375, 0.53570556640625, 0.5538482666015625, 0.571990966796875, 0.5901336669921875, 0.6082763671875, 0.6264190673828125, 0.644561767578125, 0.6627044677734375, 0.68084716796875, 0.6989898681640625, 0.717132568359375, 0.7352752685546875, 0.75341796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 16.0, 20.0, 23.0, 39.0, 41.0, 73.0, 84.0, 103.0, 122.0, 115.0, 97.0, 75.0, 62.0, 40.0, 22.0, 13.0, 12.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2310791015625, -0.2242145538330078, -0.21735000610351562, -0.21048545837402344, -0.20362091064453125, -0.19675636291503906, -0.18989181518554688, -0.1830272674560547, -0.1761627197265625, -0.1692981719970703, -0.16243362426757812, -0.15556907653808594, -0.14870452880859375, -0.14183998107910156, -0.13497543334960938, -0.1281108856201172, -0.121246337890625, -0.11438179016113281, -0.10751724243164062, -0.10065269470214844, -0.09378814697265625, -0.08692359924316406, -0.08005905151367188, -0.07319450378417969, -0.0663299560546875, -0.05946540832519531, -0.052600860595703125, -0.04573631286621094, -0.03887176513671875, -0.03200721740722656, -0.025142669677734375, -0.018278121948242188, -0.01141357421875, -0.0045490264892578125, 0.002315521240234375, 0.009180068969726562, 0.01604461669921875, 0.022909164428710938, 0.029773712158203125, 0.03663825988769531, 0.0435028076171875, 0.05036735534667969, 0.057231903076171875, 0.06409645080566406, 0.07096099853515625, 0.07782554626464844, 0.08469009399414062, 0.09155464172363281, 0.098419189453125, 0.10528373718261719, 0.11214828491210938, 0.11901283264160156, 0.12587738037109375, 0.13274192810058594, 0.13960647583007812, 0.1464710235595703, 0.1533355712890625, 0.1602001190185547, 0.16706466674804688, 0.17392921447753906, 0.18079376220703125, 0.18765830993652344, 0.19452285766601562, 0.2013874053955078, 0.208251953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 173.0, 708.0, 109.0, 10.0, 6.0, 1.0, 0.0, 1.0], "bins": [-22.180301666259766, -21.79336929321289, -21.406436920166016, -21.01950454711914, -20.632572174072266, -20.24563980102539, -19.858707427978516, -19.47177505493164, -19.084842681884766, -18.69791030883789, -18.310977935791016, -17.92404556274414, -17.537113189697266, -17.15018081665039, -16.763248443603516, -16.37631607055664, -15.989385604858398, -15.602453231811523, -15.215520858764648, -14.828588485717773, -14.441656112670898, -14.05472469329834, -13.667792320251465, -13.28085994720459, -12.893927574157715, -12.50699520111084, -12.120062828063965, -11.73313045501709, -11.346199035644531, -10.959266662597656, -10.572334289550781, -10.185401916503906, -9.798469543457031, -9.411537170410156, -9.024604797363281, -8.637672424316406, -8.250740051269531, -7.8638081550598145, -7.476876258850098, -7.089943885803223, -6.7030110359191895, -6.3160786628723145, -5.929146766662598, -5.542214393615723, -5.155282020568848, -4.768349647521973, -4.381417274475098, -3.994485378265381, -3.607553005218506, -3.220620632171631, -2.833688497543335, -2.446756362915039, -2.059823989868164, -1.6728917360305786, -1.2859594821929932, -0.8990273475646973, -0.5120949745178223, -0.12516272068023682, 0.26176953315734863, 0.6487017869949341, 1.0356340408325195, 1.422566294670105, 1.8094985485076904, 2.1964306831359863, 2.5833630561828613]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 12.0, 10.0, 21.0, 22.0, 29.0, 29.0, 49.0, 46.0, 71.0, 89.0, 87.0, 92.0, 74.0, 70.0, 73.0, 49.0, 49.0, 38.0, 29.0, 20.0, 15.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9082056283950806, -1.8585504293441772, -1.8088951110839844, -1.759239912033081, -1.7095847129821777, -1.6599295139312744, -1.6102741956710815, -1.5606189966201782, -1.5109636783599854, -1.461308479309082, -1.4116531610488892, -1.3619979619979858, -1.3123427629470825, -1.2626874446868896, -1.2130322456359863, -1.163377046585083, -1.1137218475341797, -1.0640666484832764, -1.0144113302230835, -0.9647561311721802, -0.9151009321212769, -0.8654456734657288, -0.8157904148101807, -0.7661352157592773, -0.7164799571037292, -0.6668246984481812, -0.6171694993972778, -0.5675142407417297, -0.5178589820861816, -0.4682037830352783, -0.4185485243797302, -0.3688932955265045, -0.3192380666732788, -0.2695828378200531, -0.2199275940656662, -0.1702723503112793, -0.12061712145805359, -0.07096189260482788, -0.021306633949279785, 0.028348594903945923, 0.07800382375717163, 0.12765905261039734, 0.17731429636478424, 0.22696954011917114, 0.27662476897239685, 0.32627999782562256, 0.37593525648117065, 0.42559048533439636, 0.47524571418762207, 0.5249009728431702, 0.5745561718940735, 0.6242114305496216, 0.6738666296005249, 0.723521888256073, 0.7731771469116211, 0.8228323459625244, 0.8724876046180725, 0.9221428632736206, 0.9717980623245239, 1.0214533805847168, 1.0711085796356201, 1.1207637786865234, 1.1704189777374268, 1.2200742959976196, 1.269729495048523]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 10.0, 14.0, 15.0, 16.0, 38.0, 30.0, 34.0, 54.0, 61.0, 82.0, 104.0, 143.0, 236.0, 514.0, 1536068.0, 2655931.0, 492.0, 179.0, 88.0, 67.0, 36.0, 20.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.171875, -6.0316162109375, -5.891357421875, -5.7510986328125, -5.61083984375, -5.4705810546875, -5.330322265625, -5.1900634765625, -5.0498046875, -4.9095458984375, -4.769287109375, -4.6290283203125, -4.48876953125, -4.3485107421875, -4.208251953125, -4.0679931640625, -3.927734375, -3.7874755859375, -3.647216796875, -3.5069580078125, -3.36669921875, -3.2264404296875, -3.086181640625, -2.9459228515625, -2.8056640625, -2.6654052734375, -2.525146484375, -2.3848876953125, -2.24462890625, -2.1043701171875, -1.964111328125, -1.8238525390625, -1.68359375, -1.5433349609375, -1.403076171875, -1.2628173828125, -1.12255859375, -0.9822998046875, -0.842041015625, -0.7017822265625, -0.5615234375, -0.4212646484375, -0.281005859375, -0.1407470703125, -0.00048828125, 0.1397705078125, 0.280029296875, 0.4202880859375, 0.560546875, 0.7008056640625, 0.841064453125, 0.9813232421875, 1.12158203125, 1.2618408203125, 1.402099609375, 1.5423583984375, 1.6826171875, 1.8228759765625, 1.963134765625, 2.1033935546875, 2.24365234375, 2.3839111328125, 2.524169921875, 2.6644287109375, 2.8046875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 33.0, 109.0, 223.0, 331.0, 199.0, 75.0, 24.0, 7.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.2305908203125, -0.22642183303833008, -0.22225284576416016, -0.21808385848999023, -0.2139148712158203, -0.2097458839416504, -0.20557689666748047, -0.20140790939331055, -0.19723892211914062, -0.1930699348449707, -0.18890094757080078, -0.18473196029663086, -0.18056297302246094, -0.17639398574829102, -0.1722249984741211, -0.16805601119995117, -0.16388702392578125, -0.15971803665161133, -0.1555490493774414, -0.15138006210327148, -0.14721107482910156, -0.14304208755493164, -0.13887310028076172, -0.1347041130065918, -0.13053512573242188, -0.12636613845825195, -0.12219715118408203, -0.11802816390991211, -0.11385917663574219, -0.10969018936157227, -0.10552120208740234, -0.10135221481323242, -0.0971832275390625, -0.09301424026489258, -0.08884525299072266, -0.08467626571655273, -0.08050727844238281, -0.07633829116821289, -0.07216930389404297, -0.06800031661987305, -0.06383132934570312, -0.0596623420715332, -0.05549335479736328, -0.05132436752319336, -0.04715538024902344, -0.042986392974853516, -0.038817405700683594, -0.03464841842651367, -0.03047943115234375, -0.026310443878173828, -0.022141456604003906, -0.017972469329833984, -0.013803482055664062, -0.00963449478149414, -0.005465507507324219, -0.0012965202331542969, 0.002872467041015625, 0.007041454315185547, 0.011210441589355469, 0.01537942886352539, 0.019548416137695312, 0.023717403411865234, 0.027886390686035156, 0.03205537796020508, 0.036224365234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 19.0, 27.0, 42.0, 68.0, 111.0, 225.0, 903.0, 4157383.0, 34683.0, 466.0, 169.0, 85.0, 39.0, 25.0, 20.0, 11.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0546875, -6.7314453125, -6.408203125, -6.0849609375, -5.76171875, -5.4384765625, -5.115234375, -4.7919921875, -4.46875, -4.1455078125, -3.822265625, -3.4990234375, -3.17578125, -2.8525390625, -2.529296875, -2.2060546875, -1.8828125, -1.5595703125, -1.236328125, -0.9130859375, -0.58984375, -0.2666015625, 0.056640625, 0.3798828125, 0.703125, 1.0263671875, 1.349609375, 1.6728515625, 1.99609375, 2.3193359375, 2.642578125, 2.9658203125, 3.2890625, 3.6123046875, 3.935546875, 4.2587890625, 4.58203125, 4.9052734375, 5.228515625, 5.5517578125, 5.875, 6.1982421875, 6.521484375, 6.8447265625, 7.16796875, 7.4912109375, 7.814453125, 8.1376953125, 8.4609375, 8.7841796875, 9.107421875, 9.4306640625, 9.75390625, 10.0771484375, 10.400390625, 10.7236328125, 11.046875, 11.3701171875, 11.693359375, 12.0166015625, 12.33984375, 12.6630859375, 12.986328125, 13.3095703125, 13.6328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 17.0, 76.0, 597.0, 2998.0, 271.0, 78.0, 29.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.6613922119140625, -0.644561767578125, -0.6277313232421875, -0.61090087890625, -0.5940704345703125, -0.577239990234375, -0.5604095458984375, -0.5435791015625, -0.5267486572265625, -0.509918212890625, -0.4930877685546875, -0.47625732421875, -0.4594268798828125, -0.442596435546875, -0.4257659912109375, -0.408935546875, -0.3921051025390625, -0.375274658203125, -0.3584442138671875, -0.34161376953125, -0.3247833251953125, -0.307952880859375, -0.2911224365234375, -0.2742919921875, -0.2574615478515625, -0.240631103515625, -0.2238006591796875, -0.20697021484375, -0.1901397705078125, -0.173309326171875, -0.1564788818359375, -0.1396484375, -0.1228179931640625, -0.105987548828125, -0.0891571044921875, -0.07232666015625, -0.0554962158203125, -0.038665771484375, -0.0218353271484375, -0.0050048828125, 0.0118255615234375, 0.028656005859375, 0.0454864501953125, 0.06231689453125, 0.0791473388671875, 0.095977783203125, 0.1128082275390625, 0.129638671875, 0.1464691162109375, 0.163299560546875, 0.1801300048828125, 0.19696044921875, 0.2137908935546875, 0.230621337890625, 0.2474517822265625, 0.2642822265625, 0.2811126708984375, 0.297943115234375, 0.3147735595703125, 0.33160400390625, 0.3484344482421875, 0.365264892578125, 0.3820953369140625, 0.39892578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 16.0, 41.0, 222.0, 510.0, 149.0, 34.0, 15.0, 10.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-10.385074615478516, -10.190502166748047, -9.995928764343262, -9.801355361938477, -9.606782913208008, -9.412210464477539, -9.217637062072754, -9.023063659667969, -8.8284912109375, -8.633918762207031, -8.439345359802246, -8.244771957397461, -8.050199508666992, -7.855626583099365, -7.661053657531738, -7.466480731964111, -7.271907806396484, -7.077334880828857, -6.8827619552612305, -6.6881890296936035, -6.493616104125977, -6.29904317855835, -6.104470252990723, -5.909897327423096, -5.715324401855469, -5.520751476287842, -5.326178550720215, -5.131605625152588, -4.937032699584961, -4.742459774017334, -4.547886848449707, -4.35331392288208, -4.158741474151611, -3.9641685485839844, -3.7695956230163574, -3.5750226974487305, -3.3804497718811035, -3.1858768463134766, -2.9913039207458496, -2.7967309951782227, -2.6021580696105957, -2.4075851440429688, -2.213012218475342, -2.018439292907715, -1.823866367340088, -1.629293441772461, -1.434720516204834, -1.240147590637207, -1.04557466506958, -0.8510017395019531, -0.6564288139343262, -0.4618558883666992, -0.26728296279907227, -0.07271003723144531, 0.12186288833618164, 0.3164358139038086, 0.5110087394714355, 0.7055816650390625, 0.9001545906066895, 1.0947275161743164, 1.2893004417419434, 1.4838733673095703, 1.6784462928771973, 1.8730192184448242, 2.067592144012451]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 12.0, 24.0, 47.0, 50.0, 90.0, 94.0, 96.0, 131.0, 119.0, 98.0, 72.0, 55.0, 34.0, 27.0, 17.0, 9.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4142887592315674, -1.3648885488510132, -1.315488338470459, -1.2660882472991943, -1.2166880369186401, -1.167287826538086, -1.1178877353668213, -1.068487524986267, -1.019087314605713, -0.9696871042251587, -0.9202869534492493, -0.8708868026733398, -0.8214865922927856, -0.7720863819122314, -0.722686231136322, -0.6732860803604126, -0.6238858699798584, -0.5744856595993042, -0.5250855088233948, -0.47568532824516296, -0.42628514766693115, -0.37688496708869934, -0.32748478651046753, -0.2780846059322357, -0.2286844253540039, -0.1792842447757721, -0.12988406419754028, -0.08048388361930847, -0.03108370304107666, 0.01831647753715515, 0.06771665811538696, 0.11711683869361877, 0.16651701927185059, 0.2159171998500824, 0.2653173804283142, 0.314717561006546, 0.36411774158477783, 0.41351792216300964, 0.46291810274124146, 0.5123182535171509, 0.5617184638977051, 0.6111186742782593, 0.6605188250541687, 0.7099189758300781, 0.7593191862106323, 0.8087193965911865, 0.858119547367096, 0.9075196981430054, 0.9569199085235596, 1.0063201189041138, 1.055720329284668, 1.1051204204559326, 1.1545206308364868, 1.203920841217041, 1.2533209323883057, 1.3027211427688599, 1.352121353149414, 1.4015215635299683, 1.4509217739105225, 1.500321865081787, 1.5497220754623413, 1.5991222858428955, 1.6485223770141602, 1.6979225873947144, 1.7473227977752686]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 12.0, 17.0, 11.0, 16.0, 29.0, 37.0, 50.0, 54.0, 91.0, 183.0, 302.0, 781.0, 3049.0, 26968.0, 784521.0, 220657.0, 9049.0, 1562.0, 513.0, 219.0, 119.0, 75.0, 45.0, 37.0, 18.0, 20.0, 22.0, 19.0, 13.0, 6.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8076171875, -1.7469329833984375, -1.686248779296875, -1.6255645751953125, -1.56488037109375, -1.5041961669921875, -1.443511962890625, -1.3828277587890625, -1.3221435546875, -1.2614593505859375, -1.200775146484375, -1.1400909423828125, -1.07940673828125, -1.0187225341796875, -0.958038330078125, -0.8973541259765625, -0.836669921875, -0.7759857177734375, -0.715301513671875, -0.6546173095703125, -0.59393310546875, -0.5332489013671875, -0.472564697265625, -0.4118804931640625, -0.3511962890625, -0.2905120849609375, -0.229827880859375, -0.1691436767578125, -0.10845947265625, -0.0477752685546875, 0.012908935546875, 0.0735931396484375, 0.13427734375, 0.1949615478515625, 0.255645751953125, 0.3163299560546875, 0.37701416015625, 0.4376983642578125, 0.498382568359375, 0.5590667724609375, 0.6197509765625, 0.6804351806640625, 0.741119384765625, 0.8018035888671875, 0.86248779296875, 0.9231719970703125, 0.983856201171875, 1.0445404052734375, 1.105224609375, 1.1659088134765625, 1.226593017578125, 1.2872772216796875, 1.34796142578125, 1.4086456298828125, 1.469329833984375, 1.5300140380859375, 1.5906982421875, 1.6513824462890625, 1.712066650390625, 1.7727508544921875, 1.83343505859375, 1.8941192626953125, 1.954803466796875, 2.0154876708984375, 2.076171875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 38.0, 64.0, 138.0, 178.0, 232.0, 165.0, 105.0, 46.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.261962890625, -0.2569441795349121, -0.2519254684448242, -0.24690675735473633, -0.24188804626464844, -0.23686933517456055, -0.23185062408447266, -0.22683191299438477, -0.22181320190429688, -0.21679449081420898, -0.2117757797241211, -0.2067570686340332, -0.2017383575439453, -0.19671964645385742, -0.19170093536376953, -0.18668222427368164, -0.18166351318359375, -0.17664480209350586, -0.17162609100341797, -0.16660737991333008, -0.1615886688232422, -0.1565699577331543, -0.1515512466430664, -0.14653253555297852, -0.14151382446289062, -0.13649511337280273, -0.13147640228271484, -0.12645769119262695, -0.12143898010253906, -0.11642026901245117, -0.11140155792236328, -0.10638284683227539, -0.1013641357421875, -0.09634542465209961, -0.09132671356201172, -0.08630800247192383, -0.08128929138183594, -0.07627058029174805, -0.07125186920166016, -0.06623315811157227, -0.061214447021484375, -0.056195735931396484, -0.051177024841308594, -0.0461583137512207, -0.04113960266113281, -0.03612089157104492, -0.03110218048095703, -0.02608346939086914, -0.02106475830078125, -0.01604604721069336, -0.011027336120605469, -0.006008625030517578, -0.0009899139404296875, 0.004028797149658203, 0.009047508239746094, 0.014066219329833984, 0.019084930419921875, 0.024103641510009766, 0.029122352600097656, 0.03414106369018555, 0.03915977478027344, 0.04417848587036133, 0.04919719696044922, 0.05421590805053711, 0.059234619140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 6.0, 11.0, 16.0, 15.0, 24.0, 32.0, 29.0, 52.0, 81.0, 112.0, 150.0, 242.0, 360.0, 545.0, 1062.0, 2020.0, 4595.0, 13991.0, 59591.0, 318282.0, 495579.0, 115676.0, 23076.0, 6842.0, 2812.0, 1307.0, 733.0, 437.0, 256.0, 174.0, 134.0, 88.0, 59.0, 46.0, 24.0, 20.0, 17.0, 13.0, 8.0, 4.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51025390625, -0.492156982421875, -0.47406005859375, -0.455963134765625, -0.4378662109375, -0.419769287109375, -0.40167236328125, -0.383575439453125, -0.365478515625, -0.347381591796875, -0.32928466796875, -0.311187744140625, -0.2930908203125, -0.274993896484375, -0.25689697265625, -0.238800048828125, -0.220703125, -0.202606201171875, -0.18450927734375, -0.166412353515625, -0.1483154296875, -0.130218505859375, -0.11212158203125, -0.094024658203125, -0.075927734375, -0.057830810546875, -0.03973388671875, -0.021636962890625, -0.0035400390625, 0.014556884765625, 0.03265380859375, 0.050750732421875, 0.06884765625, 0.086944580078125, 0.10504150390625, 0.123138427734375, 0.1412353515625, 0.159332275390625, 0.17742919921875, 0.195526123046875, 0.213623046875, 0.231719970703125, 0.24981689453125, 0.267913818359375, 0.2860107421875, 0.304107666015625, 0.32220458984375, 0.340301513671875, 0.3583984375, 0.376495361328125, 0.39459228515625, 0.412689208984375, 0.4307861328125, 0.448883056640625, 0.46697998046875, 0.485076904296875, 0.503173828125, 0.521270751953125, 0.53936767578125, 0.557464599609375, 0.5755615234375, 0.593658447265625, 0.61175537109375, 0.629852294921875, 0.64794921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 5.0, 10.0, 9.0, 8.0, 20.0, 13.0, 20.0, 22.0, 25.0, 36.0, 40.0, 46.0, 51.0, 49.0, 51.0, 48.0, 43.0, 63.0, 66.0, 60.0, 64.0, 48.0, 42.0, 32.0, 26.0, 25.0, 25.0, 14.0, 10.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.29833984375, -0.28994178771972656, -0.2815437316894531, -0.2731456756591797, -0.26474761962890625, -0.2563495635986328, -0.24795150756835938, -0.23955345153808594, -0.2311553955078125, -0.22275733947753906, -0.21435928344726562, -0.2059612274169922, -0.19756317138671875, -0.1891651153564453, -0.18076705932617188, -0.17236900329589844, -0.163970947265625, -0.15557289123535156, -0.14717483520507812, -0.1387767791748047, -0.13037872314453125, -0.12198066711425781, -0.11358261108398438, -0.10518455505371094, -0.0967864990234375, -0.08838844299316406, -0.07999038696289062, -0.07159233093261719, -0.06319427490234375, -0.05479621887207031, -0.046398162841796875, -0.03800010681152344, -0.02960205078125, -0.021203994750976562, -0.012805938720703125, -0.0044078826904296875, 0.00399017333984375, 0.012388229370117188, 0.020786285400390625, 0.029184341430664062, 0.0375823974609375, 0.04598045349121094, 0.054378509521484375, 0.06277656555175781, 0.07117462158203125, 0.07957267761230469, 0.08797073364257812, 0.09636878967285156, 0.104766845703125, 0.11316490173339844, 0.12156295776367188, 0.1299610137939453, 0.13835906982421875, 0.1467571258544922, 0.15515518188476562, 0.16355323791503906, 0.1719512939453125, 0.18034934997558594, 0.18874740600585938, 0.1971454620361328, 0.20554351806640625, 0.2139415740966797, 0.22233963012695312, 0.23073768615722656, 0.2391357421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 19.0, 27.0, 43.0, 80.0, 154.0, 317.0, 698.0, 3330.0, 128839.0, 904774.0, 8252.0, 1181.0, 400.0, 211.0, 109.0, 42.0, 25.0, 12.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -2.0149993896484375, -1.957733154296875, -1.9004669189453125, -1.84320068359375, -1.7859344482421875, -1.728668212890625, -1.6714019775390625, -1.6141357421875, -1.5568695068359375, -1.499603271484375, -1.4423370361328125, -1.38507080078125, -1.3278045654296875, -1.270538330078125, -1.2132720947265625, -1.156005859375, -1.0987396240234375, -1.041473388671875, -0.9842071533203125, -0.92694091796875, -0.8696746826171875, -0.812408447265625, -0.7551422119140625, -0.6978759765625, -0.6406097412109375, -0.583343505859375, -0.5260772705078125, -0.46881103515625, -0.4115447998046875, -0.354278564453125, -0.2970123291015625, -0.23974609375, -0.1824798583984375, -0.125213623046875, -0.0679473876953125, -0.01068115234375, 0.0465850830078125, 0.103851318359375, 0.1611175537109375, 0.2183837890625, 0.2756500244140625, 0.332916259765625, 0.3901824951171875, 0.44744873046875, 0.5047149658203125, 0.561981201171875, 0.6192474365234375, 0.676513671875, 0.7337799072265625, 0.791046142578125, 0.8483123779296875, 0.90557861328125, 0.9628448486328125, 1.020111083984375, 1.0773773193359375, 1.1346435546875, 1.1919097900390625, 1.249176025390625, 1.3064422607421875, 1.36370849609375, 1.4209747314453125, 1.478240966796875, 1.5355072021484375, 1.5927734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 2.0, 9.0, 9.0, 6.0, 11.0, 6.0, 16.0, 24.0, 17.0, 38.0, 34.0, 38.0, 57.0, 71.0, 81.0, 86.0, 87.0, 75.0, 54.0, 52.0, 44.0, 33.0, 25.0, 18.0, 15.0, 12.0, 17.0, 7.0, 10.0, 10.0, 4.0, 7.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011813640594482422, -0.00011442694813013077, -0.00011071749031543732, -0.00010700803250074387, -0.00010329857468605042, -9.958911687135696e-05, -9.587965905666351e-05, -9.217020124197006e-05, -8.846074342727661e-05, -8.475128561258316e-05, -8.104182779788971e-05, -7.733236998319626e-05, -7.362291216850281e-05, -6.991345435380936e-05, -6.62039965391159e-05, -6.249453872442245e-05, -5.8785080909729004e-05, -5.507562309503555e-05, -5.13661652803421e-05, -4.765670746564865e-05, -4.39472496509552e-05, -4.023779183626175e-05, -3.65283340215683e-05, -3.281887620687485e-05, -2.9109418392181396e-05, -2.5399960577487946e-05, -2.1690502762794495e-05, -1.7981044948101044e-05, -1.4271587133407593e-05, -1.0562129318714142e-05, -6.852671504020691e-06, -3.14321368932724e-06, 5.662441253662109e-07, 4.275701940059662e-06, 7.985159754753113e-06, 1.1694617569446564e-05, 1.5404075384140015e-05, 1.9113533198833466e-05, 2.2822991013526917e-05, 2.6532448828220367e-05, 3.024190664291382e-05, 3.395136445760727e-05, 3.766082227230072e-05, 4.137028008699417e-05, 4.507973790168762e-05, 4.878919571638107e-05, 5.2498653531074524e-05, 5.6208111345767975e-05, 5.9917569160461426e-05, 6.362702697515488e-05, 6.733648478984833e-05, 7.104594260454178e-05, 7.475540041923523e-05, 7.846485823392868e-05, 8.217431604862213e-05, 8.588377386331558e-05, 8.959323167800903e-05, 9.330268949270248e-05, 9.701214730739594e-05, 0.00010072160512208939, 0.00010443106293678284, 0.00010814052075147629, 0.00011184997856616974, 0.00011555943638086319, 0.00011926889419555664]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 6.0, 3.0, 12.0, 16.0, 28.0, 51.0, 78.0, 131.0, 223.0, 426.0, 876.0, 2669.0, 10718.0, 87232.0, 831652.0, 98520.0, 11342.0, 2775.0, 923.0, 376.0, 179.0, 112.0, 62.0, 39.0, 25.0, 15.0, 12.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77294921875, -0.74676513671875, -0.7205810546875, -0.69439697265625, -0.668212890625, -0.64202880859375, -0.6158447265625, -0.58966064453125, -0.5634765625, -0.53729248046875, -0.5111083984375, -0.48492431640625, -0.458740234375, -0.43255615234375, -0.4063720703125, -0.38018798828125, -0.35400390625, -0.32781982421875, -0.3016357421875, -0.27545166015625, -0.249267578125, -0.22308349609375, -0.1968994140625, -0.17071533203125, -0.14453125, -0.11834716796875, -0.0921630859375, -0.06597900390625, -0.039794921875, -0.01361083984375, 0.0125732421875, 0.03875732421875, 0.06494140625, 0.09112548828125, 0.1173095703125, 0.14349365234375, 0.169677734375, 0.19586181640625, 0.2220458984375, 0.24822998046875, 0.2744140625, 0.30059814453125, 0.3267822265625, 0.35296630859375, 0.379150390625, 0.40533447265625, 0.4315185546875, 0.45770263671875, 0.48388671875, 0.51007080078125, 0.5362548828125, 0.56243896484375, 0.588623046875, 0.61480712890625, 0.6409912109375, 0.66717529296875, 0.693359375, 0.71954345703125, 0.7457275390625, 0.77191162109375, 0.798095703125, 0.82427978515625, 0.8504638671875, 0.87664794921875, 0.90283203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 10.0, 14.0, 28.0, 54.0, 81.0, 109.0, 154.0, 147.0, 114.0, 100.0, 67.0, 43.0, 15.0, 15.0, 7.0, 8.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4340171813964844, -0.42296600341796875, -0.4119148254394531, -0.4008636474609375, -0.3898124694824219, -0.37876129150390625, -0.3677101135253906, -0.356658935546875, -0.3456077575683594, -0.33455657958984375, -0.3235054016113281, -0.3124542236328125, -0.3014030456542969, -0.29035186767578125, -0.2793006896972656, -0.26824951171875, -0.2571983337402344, -0.24614715576171875, -0.23509597778320312, -0.2240447998046875, -0.21299362182617188, -0.20194244384765625, -0.19089126586914062, -0.179840087890625, -0.16878890991210938, -0.15773773193359375, -0.14668655395507812, -0.1356353759765625, -0.12458419799804688, -0.11353302001953125, -0.10248184204101562, -0.0914306640625, -0.08037948608398438, -0.06932830810546875, -0.058277130126953125, -0.0472259521484375, -0.036174774169921875, -0.02512359619140625, -0.014072418212890625, -0.003021240234375, 0.008029937744140625, 0.01908111572265625, 0.030132293701171875, 0.0411834716796875, 0.052234649658203125, 0.06328582763671875, 0.07433700561523438, 0.08538818359375, 0.09643936157226562, 0.10749053955078125, 0.11854171752929688, 0.1295928955078125, 0.14064407348632812, 0.15169525146484375, 0.16274642944335938, 0.173797607421875, 0.18484878540039062, 0.19589996337890625, 0.20695114135742188, 0.2180023193359375, 0.22905349731445312, 0.24010467529296875, 0.2511558532714844, 0.26220703125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 10.0, 13.0, 39.0, 97.0, 198.0, 272.0, 179.0, 117.0, 47.0, 14.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.4218430519104, -7.24770975112915, -7.0735764503479, -6.899442672729492, -6.725309371948242, -6.551176071166992, -6.377042770385742, -6.202909469604492, -6.028775691986084, -5.854642391204834, -5.680509090423584, -5.506375312805176, -5.332242012023926, -5.158108711242676, -4.983975410461426, -4.809842109680176, -4.635708808898926, -4.461575508117676, -4.287442207336426, -4.113308429718018, -3.9391751289367676, -3.7650418281555176, -3.5909085273742676, -3.4167749881744385, -3.2426414489746094, -3.0685081481933594, -2.8943746089935303, -2.7202413082122803, -2.546107769012451, -2.371974468231201, -2.197841167449951, -2.023707628250122, -1.8495738506317139, -1.6754404306411743, -1.5013070106506348, -1.3271737098693848, -1.1530401706695557, -0.9789068102836609, -0.8047734498977661, -0.6306400299072266, -0.456506609916687, -0.28237318992614746, -0.1082397997379303, 0.06589359045028687, 0.24002701044082642, 0.41416043043136597, 0.5882937908172607, 0.7624272108078003, 0.9365606307983398, 1.1106940507888794, 1.284827470779419, 1.458960771560669, 1.633094310760498, 1.807227611541748, 1.9813610315322876, 2.155494451522827, 2.3296279907226562, 2.5037612915039062, 2.6778948307037354, 2.8520281314849854, 3.0261616706848145, 3.2002949714660645, 3.3744282722473145, 3.5485618114471436, 3.7226951122283936]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 7.0, 6.0, 8.0, 14.0, 21.0, 13.0, 32.0, 29.0, 24.0, 44.0, 48.0, 54.0, 49.0, 45.0, 64.0, 57.0, 53.0, 61.0, 40.0, 54.0, 48.0, 39.0, 38.0, 26.0, 27.0, 17.0, 13.0, 24.0, 11.0, 11.0, 7.0, 8.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0], "bins": [-2.2807202339172363, -2.2223715782165527, -2.164022922515869, -2.1056742668151855, -2.047325611114502, -1.9889768362045288, -1.9306280612945557, -1.872279405593872, -1.8139307498931885, -1.7555820941925049, -1.6972334384918213, -1.6388846635818481, -1.5805360078811646, -1.522187352180481, -1.4638385772705078, -1.4054899215698242, -1.3471412658691406, -1.288792610168457, -1.2304439544677734, -1.1720951795578003, -1.1137465238571167, -1.055397868156433, -0.9970491528511047, -0.9387004375457764, -0.8803517818450928, -0.8220031261444092, -0.7636544108390808, -0.7053056955337524, -0.6469570398330688, -0.5886083841323853, -0.5302596688270569, -0.4719109833240509, -0.4135622978210449, -0.35521361231803894, -0.29686492681503296, -0.23851624131202698, -0.180167555809021, -0.12181887030601501, -0.06347018480300903, -0.005121499300003052, 0.05322718620300293, 0.11157587170600891, 0.1699245572090149, 0.22827324271202087, 0.28662192821502686, 0.34497061371803284, 0.4033192992210388, 0.4616679847240448, 0.5200166702270508, 0.5783653259277344, 0.6367140412330627, 0.6950627565383911, 0.7534114122390747, 0.8117600679397583, 0.8701087832450867, 0.928457498550415, 0.9868061542510986, 1.0451548099517822, 1.1035034656524658, 1.161852240562439, 1.2202008962631226, 1.2785495519638062, 1.3368983268737793, 1.395246982574463, 1.4535956382751465]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 7.0, 5.0, 13.0, 13.0, 15.0, 23.0, 17.0, 18.0, 24.0, 35.0, 33.0, 61.0, 63.0, 98.0, 144.0, 218.0, 589.0, 1993.0, 16505.0, 3264047.0, 893623.0, 14081.0, 1825.0, 425.0, 167.0, 72.0, 48.0, 34.0, 21.0, 18.0, 14.0, 6.0, 6.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.6732177734375, -2.594482421875, -2.5157470703125, -2.43701171875, -2.3582763671875, -2.279541015625, -2.2008056640625, -2.1220703125, -2.0433349609375, -1.964599609375, -1.8858642578125, -1.80712890625, -1.7283935546875, -1.649658203125, -1.5709228515625, -1.4921875, -1.4134521484375, -1.334716796875, -1.2559814453125, -1.17724609375, -1.0985107421875, -1.019775390625, -0.9410400390625, -0.8623046875, -0.7835693359375, -0.704833984375, -0.6260986328125, -0.54736328125, -0.4686279296875, -0.389892578125, -0.3111572265625, -0.232421875, -0.1536865234375, -0.074951171875, 0.0037841796875, 0.08251953125, 0.1612548828125, 0.239990234375, 0.3187255859375, 0.3974609375, 0.4761962890625, 0.554931640625, 0.6336669921875, 0.71240234375, 0.7911376953125, 0.869873046875, 0.9486083984375, 1.02734375, 1.1060791015625, 1.184814453125, 1.2635498046875, 1.34228515625, 1.4210205078125, 1.499755859375, 1.5784912109375, 1.6572265625, 1.7359619140625, 1.814697265625, 1.8934326171875, 1.97216796875, 2.0509033203125, 2.129638671875, 2.2083740234375, 2.287109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 33.0, 78.0, 126.0, 142.0, 193.0, 159.0, 117.0, 76.0, 37.0, 18.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24529647827148438, -0.24034881591796875, -0.23540115356445312, -0.2304534912109375, -0.22550582885742188, -0.22055816650390625, -0.21561050415039062, -0.210662841796875, -0.20571517944335938, -0.20076751708984375, -0.19581985473632812, -0.1908721923828125, -0.18592453002929688, -0.18097686767578125, -0.17602920532226562, -0.17108154296875, -0.16613388061523438, -0.16118621826171875, -0.15623855590820312, -0.1512908935546875, -0.14634323120117188, -0.14139556884765625, -0.13644790649414062, -0.131500244140625, -0.12655258178710938, -0.12160491943359375, -0.11665725708007812, -0.1117095947265625, -0.10676193237304688, -0.10181427001953125, -0.09686660766601562, -0.0919189453125, -0.08697128295898438, -0.08202362060546875, -0.07707595825195312, -0.0721282958984375, -0.06718063354492188, -0.06223297119140625, -0.057285308837890625, -0.052337646484375, -0.047389984130859375, -0.04244232177734375, -0.037494659423828125, -0.0325469970703125, -0.027599334716796875, -0.02265167236328125, -0.017704010009765625, -0.01275634765625, -0.007808685302734375, -0.00286102294921875, 0.002086639404296875, 0.0070343017578125, 0.011981964111328125, 0.01692962646484375, 0.021877288818359375, 0.026824951171875, 0.031772613525390625, 0.03672027587890625, 0.041667938232421875, 0.0466156005859375, 0.051563262939453125, 0.05651092529296875, 0.061458587646484375, 0.06640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 10.0, 13.0, 12.0, 20.0, 30.0, 49.0, 47.0, 92.0, 202.0, 609.0, 2918.0, 3919008.0, 268346.0, 2044.0, 491.0, 160.0, 64.0, 46.0, 39.0, 22.0, 19.0, 9.0, 10.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.08935546875, -6.8740234375, -6.65869140625, -6.443359375, -6.22802734375, -6.0126953125, -5.79736328125, -5.58203125, -5.36669921875, -5.1513671875, -4.93603515625, -4.720703125, -4.50537109375, -4.2900390625, -4.07470703125, -3.859375, -3.64404296875, -3.4287109375, -3.21337890625, -2.998046875, -2.78271484375, -2.5673828125, -2.35205078125, -2.13671875, -1.92138671875, -1.7060546875, -1.49072265625, -1.275390625, -1.06005859375, -0.8447265625, -0.62939453125, -0.4140625, -0.19873046875, 0.0166015625, 0.23193359375, 0.447265625, 0.66259765625, 0.8779296875, 1.09326171875, 1.30859375, 1.52392578125, 1.7392578125, 1.95458984375, 2.169921875, 2.38525390625, 2.6005859375, 2.81591796875, 3.03125, 3.24658203125, 3.4619140625, 3.67724609375, 3.892578125, 4.10791015625, 4.3232421875, 4.53857421875, 4.75390625, 4.96923828125, 5.1845703125, 5.39990234375, 5.615234375, 5.83056640625, 6.0458984375, 6.26123046875, 6.4765625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 12.0, 15.0, 33.0, 109.0, 468.0, 2817.0, 453.0, 124.0, 27.0, 16.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73828125, -0.7204818725585938, -0.7026824951171875, -0.6848831176757812, -0.667083740234375, -0.6492843627929688, -0.6314849853515625, -0.6136856079101562, -0.59588623046875, -0.5780868530273438, -0.5602874755859375, -0.5424880981445312, -0.524688720703125, -0.5068893432617188, -0.4890899658203125, -0.47129058837890625, -0.4534912109375, -0.43569183349609375, -0.4178924560546875, -0.40009307861328125, -0.382293701171875, -0.36449432373046875, -0.3466949462890625, -0.32889556884765625, -0.31109619140625, -0.29329681396484375, -0.2754974365234375, -0.25769805908203125, -0.239898681640625, -0.22209930419921875, -0.2042999267578125, -0.18650054931640625, -0.168701171875, -0.15090179443359375, -0.1331024169921875, -0.11530303955078125, -0.097503662109375, -0.07970428466796875, -0.0619049072265625, -0.04410552978515625, -0.02630615234375, -0.00850677490234375, 0.0092926025390625, 0.02709197998046875, 0.044891357421875, 0.06269073486328125, 0.0804901123046875, 0.09828948974609375, 0.1160888671875, 0.13388824462890625, 0.1516876220703125, 0.16948699951171875, 0.187286376953125, 0.20508575439453125, 0.2228851318359375, 0.24068450927734375, 0.25848388671875, 0.27628326416015625, 0.2940826416015625, 0.31188201904296875, 0.329681396484375, 0.34748077392578125, 0.3652801513671875, 0.38307952880859375, 0.40087890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 12.0, 11.0, 24.0, 55.0, 106.0, 164.0, 215.0, 174.0, 109.0, 46.0, 29.0, 18.0, 9.0, 7.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0067596435546875, -3.910369396209717, -3.813978910446167, -3.7175886631011963, -3.6211984157562256, -3.524807929992676, -3.428417682647705, -3.3320274353027344, -3.2356371879577637, -3.139246940612793, -3.042856454849243, -2.9464662075042725, -2.8500759601593018, -2.753685474395752, -2.6572952270507812, -2.5609049797058105, -2.4645144939422607, -2.36812424659729, -2.2717337608337402, -2.1753435134887695, -2.078953266143799, -1.9825628995895386, -1.8861725330352783, -1.7897822856903076, -1.6933919191360474, -1.597001552581787, -1.5006113052368164, -1.4042209386825562, -1.307830572128296, -1.2114403247833252, -1.115049958229065, -1.0186595916748047, -0.9222695827484131, -0.8258792757987976, -0.7294889688491821, -0.6330986022949219, -0.5367082953453064, -0.4403179883956909, -0.34392762184143066, -0.24753731489181519, -0.1511470079421997, -0.054756686091423035, 0.04163363575935364, 0.1380239725112915, 0.23441427946090698, 0.33080458641052246, 0.4271949529647827, 0.5235852599143982, 0.6199755668640137, 0.7163658738136292, 0.8127561807632446, 0.9091465473175049, 1.0055367946624756, 1.1019271612167358, 1.198317527770996, 1.2947077751159668, 1.391098141670227, 1.4874885082244873, 1.583878755569458, 1.6802691221237183, 1.7766594886779785, 1.8730497360229492, 1.9694401025772095, 2.0658304691314697, 2.1622207164764404]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 9.0, 11.0, 16.0, 19.0, 27.0, 38.0, 41.0, 35.0, 68.0, 64.0, 72.0, 53.0, 60.0, 82.0, 62.0, 51.0, 62.0, 42.0, 32.0, 35.0, 25.0, 28.0, 13.0, 12.0, 12.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0176641941070557, -0.9888597130775452, -0.9600552916526794, -0.931250810623169, -0.9024463295936584, -0.873641848564148, -0.8448374271392822, -0.8160329461097717, -0.7872284650802612, -0.7584239840507507, -0.729619562625885, -0.7008150815963745, -0.672010600566864, -0.6432061195373535, -0.6144016981124878, -0.5855972170829773, -0.5567927360534668, -0.5279882550239563, -0.4991838037967682, -0.4703793525695801, -0.4415748715400696, -0.41277042031288147, -0.38396596908569336, -0.35516148805618286, -0.32635706663131714, -0.29755261540412903, -0.26874813437461853, -0.23994368314743042, -0.21113920211791992, -0.1823347508907318, -0.1535302847623825, -0.1247258186340332, -0.0959213376045227, -0.0671168714761734, -0.038312409073114395, -0.00950794667005539, 0.019296519458293915, 0.04810097813606262, 0.07690544426441193, 0.10570991039276123, 0.13451437652111053, 0.16331884264945984, 0.19212330877780914, 0.22092777490615845, 0.24973222613334656, 0.27853667736053467, 0.30734115839004517, 0.33614563941955566, 0.3649500906467438, 0.3937545418739319, 0.4225590229034424, 0.4513634741306305, 0.480167955160141, 0.5089724063873291, 0.5377768874168396, 0.5665813684463501, 0.5953857898712158, 0.6241902709007263, 0.652994692325592, 0.6817991733551025, 0.710603654384613, 0.7394081354141235, 0.7682125568389893, 0.7970170378684998, 0.8258215188980103]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 4.0, 11.0, 21.0, 12.0, 36.0, 35.0, 82.0, 96.0, 214.0, 449.0, 1202.0, 5922.0, 76843.0, 871069.0, 84084.0, 6085.0, 1280.0, 502.0, 242.0, 122.0, 81.0, 48.0, 29.0, 18.0, 20.0, 12.0, 13.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.958984375, -1.892608642578125, -1.82623291015625, -1.759857177734375, -1.6934814453125, -1.627105712890625, -1.56072998046875, -1.494354248046875, -1.427978515625, -1.361602783203125, -1.29522705078125, -1.228851318359375, -1.1624755859375, -1.096099853515625, -1.02972412109375, -0.963348388671875, -0.89697265625, -0.830596923828125, -0.76422119140625, -0.697845458984375, -0.6314697265625, -0.565093994140625, -0.49871826171875, -0.432342529296875, -0.365966796875, -0.299591064453125, -0.23321533203125, -0.166839599609375, -0.1004638671875, -0.034088134765625, 0.03228759765625, 0.098663330078125, 0.1650390625, 0.231414794921875, 0.29779052734375, 0.364166259765625, 0.4305419921875, 0.496917724609375, 0.56329345703125, 0.629669189453125, 0.696044921875, 0.762420654296875, 0.82879638671875, 0.895172119140625, 0.9615478515625, 1.027923583984375, 1.09429931640625, 1.160675048828125, 1.22705078125, 1.293426513671875, 1.35980224609375, 1.426177978515625, 1.4925537109375, 1.558929443359375, 1.62530517578125, 1.691680908203125, 1.758056640625, 1.824432373046875, 1.89080810546875, 1.957183837890625, 2.0235595703125, 2.089935302734375, 2.15631103515625, 2.222686767578125, 2.2890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 15.0, 35.0, 62.0, 76.0, 110.0, 139.0, 170.0, 140.0, 95.0, 66.0, 30.0, 22.0, 23.0, 13.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.22546005249023438, -0.22069549560546875, -0.21593093872070312, -0.2111663818359375, -0.20640182495117188, -0.20163726806640625, -0.19687271118164062, -0.192108154296875, -0.18734359741210938, -0.18257904052734375, -0.17781448364257812, -0.1730499267578125, -0.16828536987304688, -0.16352081298828125, -0.15875625610351562, -0.15399169921875, -0.14922714233398438, -0.14446258544921875, -0.13969802856445312, -0.1349334716796875, -0.13016891479492188, -0.12540435791015625, -0.12063980102539062, -0.115875244140625, -0.11111068725585938, -0.10634613037109375, -0.10158157348632812, -0.0968170166015625, -0.09205245971679688, -0.08728790283203125, -0.08252334594726562, -0.0777587890625, -0.07299423217773438, -0.06822967529296875, -0.06346511840820312, -0.0587005615234375, -0.053936004638671875, -0.04917144775390625, -0.044406890869140625, -0.039642333984375, -0.034877777099609375, -0.03011322021484375, -0.025348663330078125, -0.0205841064453125, -0.015819549560546875, -0.01105499267578125, -0.006290435791015625, -0.00152587890625, 0.003238677978515625, 0.00800323486328125, 0.012767791748046875, 0.0175323486328125, 0.022296905517578125, 0.02706146240234375, 0.031826019287109375, 0.036590576171875, 0.041355133056640625, 0.04611968994140625, 0.050884246826171875, 0.0556488037109375, 0.060413360595703125, 0.06517791748046875, 0.06994247436523438, 0.07470703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 4.0, 8.0, 10.0, 24.0, 16.0, 15.0, 29.0, 33.0, 54.0, 74.0, 110.0, 158.0, 253.0, 384.0, 696.0, 1320.0, 2645.0, 6691.0, 20248.0, 95108.0, 499867.0, 340031.0, 56742.0, 14190.0, 5029.0, 2193.0, 1024.0, 592.0, 325.0, 207.0, 127.0, 98.0, 68.0, 50.0, 41.0, 20.0, 17.0, 12.0, 8.0, 5.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.8017578125, -0.7773513793945312, -0.7529449462890625, -0.7285385131835938, -0.704132080078125, -0.6797256469726562, -0.6553192138671875, -0.6309127807617188, -0.60650634765625, -0.5820999145507812, -0.5576934814453125, -0.5332870483398438, -0.508880615234375, -0.48447418212890625, -0.4600677490234375, -0.43566131591796875, -0.4112548828125, -0.38684844970703125, -0.3624420166015625, -0.33803558349609375, -0.313629150390625, -0.28922271728515625, -0.2648162841796875, -0.24040985107421875, -0.21600341796875, -0.19159698486328125, -0.1671905517578125, -0.14278411865234375, -0.118377685546875, -0.09397125244140625, -0.0695648193359375, -0.04515838623046875, -0.020751953125, 0.00365447998046875, 0.0280609130859375, 0.05246734619140625, 0.076873779296875, 0.10128021240234375, 0.1256866455078125, 0.15009307861328125, 0.17449951171875, 0.19890594482421875, 0.2233123779296875, 0.24771881103515625, 0.272125244140625, 0.29653167724609375, 0.3209381103515625, 0.34534454345703125, 0.3697509765625, 0.39415740966796875, 0.4185638427734375, 0.44297027587890625, 0.467376708984375, 0.49178314208984375, 0.5161895751953125, 0.5405960083007812, 0.56500244140625, 0.5894088745117188, 0.6138153076171875, 0.6382217407226562, 0.662628173828125, 0.6870346069335938, 0.7114410400390625, 0.7358474731445312, 0.76025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 8.0, 9.0, 8.0, 8.0, 24.0, 17.0, 21.0, 25.0, 30.0, 28.0, 34.0, 31.0, 43.0, 34.0, 40.0, 50.0, 46.0, 36.0, 50.0, 47.0, 44.0, 43.0, 38.0, 39.0, 30.0, 38.0, 27.0, 17.0, 15.0, 18.0, 11.0, 7.0, 9.0, 9.0, 7.0, 6.0, 5.0, 7.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2264404296875, -0.21875572204589844, -0.21107101440429688, -0.2033863067626953, -0.19570159912109375, -0.1880168914794922, -0.18033218383789062, -0.17264747619628906, -0.1649627685546875, -0.15727806091308594, -0.14959335327148438, -0.1419086456298828, -0.13422393798828125, -0.1265392303466797, -0.11885452270507812, -0.11116981506347656, -0.103485107421875, -0.09580039978027344, -0.08811569213867188, -0.08043098449707031, -0.07274627685546875, -0.06506156921386719, -0.057376861572265625, -0.04969215393066406, -0.0420074462890625, -0.03432273864746094, -0.026638031005859375, -0.018953323364257812, -0.01126861572265625, -0.0035839080810546875, 0.004100799560546875, 0.011785507202148438, 0.01947021484375, 0.027154922485351562, 0.034839630126953125, 0.04252433776855469, 0.05020904541015625, 0.05789375305175781, 0.06557846069335938, 0.07326316833496094, 0.0809478759765625, 0.08863258361816406, 0.09631729125976562, 0.10400199890136719, 0.11168670654296875, 0.11937141418457031, 0.12705612182617188, 0.13474082946777344, 0.142425537109375, 0.15011024475097656, 0.15779495239257812, 0.1654796600341797, 0.17316436767578125, 0.1808490753173828, 0.18853378295898438, 0.19621849060058594, 0.2039031982421875, 0.21158790588378906, 0.21927261352539062, 0.2269573211669922, 0.23464202880859375, 0.2423267364501953, 0.2500114440917969, 0.25769615173339844, 0.265380859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 8.0, 6.0, 13.0, 21.0, 24.0, 33.0, 44.0, 78.0, 123.0, 193.0, 457.0, 942.0, 2254.0, 6448.0, 22241.0, 113931.0, 566597.0, 274424.0, 43709.0, 10749.0, 3563.0, 1351.0, 622.0, 286.0, 156.0, 94.0, 54.0, 34.0, 34.0, 18.0, 17.0, 9.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.4241828918457031, -0.41037750244140625, -0.3965721130371094, -0.3827667236328125, -0.3689613342285156, -0.35515594482421875, -0.3413505554199219, -0.327545166015625, -0.3137397766113281, -0.29993438720703125, -0.2861289978027344, -0.2723236083984375, -0.2585182189941406, -0.24471282958984375, -0.23090744018554688, -0.21710205078125, -0.20329666137695312, -0.18949127197265625, -0.17568588256835938, -0.1618804931640625, -0.14807510375976562, -0.13426971435546875, -0.12046432495117188, -0.106658935546875, -0.09285354614257812, -0.07904815673828125, -0.06524276733398438, -0.0514373779296875, -0.037631988525390625, -0.02382659912109375, -0.010021209716796875, 0.0037841796875, 0.017589569091796875, 0.03139495849609375, 0.045200347900390625, 0.0590057373046875, 0.07281112670898438, 0.08661651611328125, 0.10042190551757812, 0.114227294921875, 0.12803268432617188, 0.14183807373046875, 0.15564346313476562, 0.1694488525390625, 0.18325424194335938, 0.19705963134765625, 0.21086502075195312, 0.22467041015625, 0.23847579956054688, 0.25228118896484375, 0.2660865783691406, 0.2798919677734375, 0.2936973571777344, 0.30750274658203125, 0.3213081359863281, 0.335113525390625, 0.3489189147949219, 0.36272430419921875, 0.3765296936035156, 0.3903350830078125, 0.4041404724121094, 0.41794586181640625, 0.4317512512207031, 0.445556640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 8.0, 9.0, 5.0, 11.0, 10.0, 12.0, 12.0, 24.0, 19.0, 34.0, 24.0, 42.0, 44.0, 63.0, 50.0, 63.0, 64.0, 78.0, 62.0, 52.0, 43.0, 41.0, 41.0, 37.0, 24.0, 27.0, 23.0, 16.0, 12.0, 8.0, 9.0, 4.0, 6.0, 7.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-9.018182754516602e-05, -8.776038885116577e-05, -8.533895015716553e-05, -8.291751146316528e-05, -8.049607276916504e-05, -7.80746340751648e-05, -7.565319538116455e-05, -7.32317566871643e-05, -7.081031799316406e-05, -6.838887929916382e-05, -6.596744060516357e-05, -6.354600191116333e-05, -6.112456321716309e-05, -5.870312452316284e-05, -5.62816858291626e-05, -5.3860247135162354e-05, -5.143880844116211e-05, -4.9017369747161865e-05, -4.659593105316162e-05, -4.417449235916138e-05, -4.175305366516113e-05, -3.933161497116089e-05, -3.6910176277160645e-05, -3.44887375831604e-05, -3.2067298889160156e-05, -2.9645860195159912e-05, -2.7224421501159668e-05, -2.4802982807159424e-05, -2.238154411315918e-05, -1.9960105419158936e-05, -1.753866672515869e-05, -1.5117228031158447e-05, -1.2695789337158203e-05, -1.0274350643157959e-05, -7.852911949157715e-06, -5.431473255157471e-06, -3.0100345611572266e-06, -5.885958671569824e-07, 1.8328428268432617e-06, 4.254281520843506e-06, 6.67572021484375e-06, 9.097158908843994e-06, 1.1518597602844238e-05, 1.3940036296844482e-05, 1.6361474990844727e-05, 1.878291368484497e-05, 2.1204352378845215e-05, 2.362579107284546e-05, 2.6047229766845703e-05, 2.8468668460845947e-05, 3.089010715484619e-05, 3.3311545848846436e-05, 3.573298454284668e-05, 3.8154423236846924e-05, 4.057586193084717e-05, 4.299730062484741e-05, 4.5418739318847656e-05, 4.78401780128479e-05, 5.0261616706848145e-05, 5.268305540084839e-05, 5.510449409484863e-05, 5.752593278884888e-05, 5.994737148284912e-05, 6.236881017684937e-05, 6.479024887084961e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 6.0, 8.0, 8.0, 12.0, 6.0, 28.0, 33.0, 48.0, 120.0, 195.0, 427.0, 1096.0, 3248.0, 13414.0, 105775.0, 747449.0, 153504.0, 17184.0, 3776.0, 1264.0, 470.0, 219.0, 112.0, 57.0, 43.0, 17.0, 10.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.446044921875, -0.4271202087402344, -0.40819549560546875, -0.3892707824707031, -0.3703460693359375, -0.3514213562011719, -0.33249664306640625, -0.3135719299316406, -0.294647216796875, -0.2757225036621094, -0.25679779052734375, -0.23787307739257812, -0.2189483642578125, -0.20002365112304688, -0.18109893798828125, -0.16217422485351562, -0.14324951171875, -0.12432479858398438, -0.10540008544921875, -0.08647537231445312, -0.0675506591796875, -0.048625946044921875, -0.02970123291015625, -0.010776519775390625, 0.008148193359375, 0.027072906494140625, 0.04599761962890625, 0.06492233276367188, 0.0838470458984375, 0.10277175903320312, 0.12169647216796875, 0.14062118530273438, 0.1595458984375, 0.17847061157226562, 0.19739532470703125, 0.21632003784179688, 0.2352447509765625, 0.2541694641113281, 0.27309417724609375, 0.2920188903808594, 0.310943603515625, 0.3298683166503906, 0.34879302978515625, 0.3677177429199219, 0.3866424560546875, 0.4055671691894531, 0.42449188232421875, 0.4434165954589844, 0.46234130859375, 0.4812660217285156, 0.5001907348632812, 0.5191154479980469, 0.5380401611328125, 0.5569648742675781, 0.5758895874023438, 0.5948143005371094, 0.613739013671875, 0.6326637268066406, 0.6515884399414062, 0.6705131530761719, 0.6894378662109375, 0.7083625793457031, 0.7272872924804688, 0.7462120056152344, 0.76513671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 2.0, 0.0, 6.0, 4.0, 6.0, 3.0, 15.0, 16.0, 27.0, 25.0, 52.0, 47.0, 85.0, 81.0, 115.0, 93.0, 100.0, 81.0, 64.0, 53.0, 31.0, 30.0, 19.0, 20.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25244140625, -0.24381637573242188, -0.23519134521484375, -0.22656631469726562, -0.2179412841796875, -0.20931625366210938, -0.20069122314453125, -0.19206619262695312, -0.183441162109375, -0.17481613159179688, -0.16619110107421875, -0.15756607055664062, -0.1489410400390625, -0.14031600952148438, -0.13169097900390625, -0.12306594848632812, -0.11444091796875, -0.10581588745117188, -0.09719085693359375, -0.08856582641601562, -0.0799407958984375, -0.07131576538085938, -0.06269073486328125, -0.054065704345703125, -0.045440673828125, -0.036815643310546875, -0.02819061279296875, -0.019565582275390625, -0.0109405517578125, -0.002315521240234375, 0.00630950927734375, 0.014934539794921875, 0.0235595703125, 0.032184600830078125, 0.04080963134765625, 0.049434661865234375, 0.0580596923828125, 0.06668472290039062, 0.07530975341796875, 0.08393478393554688, 0.092559814453125, 0.10118484497070312, 0.10980987548828125, 0.11843490600585938, 0.1270599365234375, 0.13568496704101562, 0.14430999755859375, 0.15293502807617188, 0.16156005859375, 0.17018508911132812, 0.17881011962890625, 0.18743515014648438, 0.1960601806640625, 0.20468521118164062, 0.21331024169921875, 0.22193527221679688, 0.230560302734375, 0.23918533325195312, 0.24781036376953125, 0.2564353942871094, 0.2650604248046875, 0.2736854553222656, 0.28231048583984375, 0.2909355163574219, 0.299560546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 14.0, 15.0, 20.0, 43.0, 80.0, 126.0, 137.0, 139.0, 128.0, 123.0, 67.0, 41.0, 25.0, 16.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.451085090637207, -5.325107097625732, -5.199129581451416, -5.073151588439941, -4.947173595428467, -4.821195602416992, -4.695218086242676, -4.569240093231201, -4.443262100219727, -4.317284107208252, -4.1913065910339355, -4.065328598022461, -3.9393506050109863, -3.813372850418091, -3.6873950958251953, -3.5614171028137207, -3.435439348220825, -3.3094615936279297, -3.183483600616455, -3.0575058460235596, -2.931527853012085, -2.8055500984191895, -2.679572105407715, -2.5535943508148193, -2.427616596221924, -2.3016388416290283, -2.1756608486175537, -2.049683094024658, -1.9237051010131836, -1.797727346420288, -1.671749472618103, -1.545771598815918, -1.4197933673858643, -1.2938154935836792, -1.1678376197814941, -1.0418598651885986, -0.9158819317817688, -0.7899040579795837, -0.6639262437820435, -0.5379483699798584, -0.41197049617767334, -0.2859926223754883, -0.1600147783756256, -0.03403693437576294, 0.09194093942642212, 0.21791881322860718, 0.34389662742614746, 0.4698745012283325, 0.5958523750305176, 0.7218302488327026, 0.8478081226348877, 0.973785936832428, 1.0997638702392578, 1.2257416248321533, 1.3517194986343384, 1.4776973724365234, 1.6036752462387085, 1.7296531200408936, 1.8556309938430786, 1.9816088676452637, 2.107586622238159, 2.233564615249634, 2.3595423698425293, 2.485520362854004, 2.6114981174468994]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 2.0, 5.0, 10.0, 11.0, 10.0, 15.0, 22.0, 19.0, 15.0, 22.0, 33.0, 40.0, 41.0, 42.0, 46.0, 40.0, 37.0, 56.0, 40.0, 45.0, 42.0, 51.0, 40.0, 43.0, 40.0, 23.0, 28.0, 19.0, 25.0, 23.0, 21.0, 10.0, 13.0, 17.0, 9.0, 8.0, 6.0, 5.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6530956029891968, -1.6028468608856201, -1.552598237991333, -1.5023494958877563, -1.4521007537841797, -1.401852011680603, -1.3516032695770264, -1.3013546466827393, -1.2511059045791626, -1.200857162475586, -1.1506085395812988, -1.1003597974777222, -1.0501110553741455, -0.9998623132705688, -0.949613630771637, -0.8993649482727051, -0.8491162061691284, -0.7988674640655518, -0.7486187815666199, -0.698370099067688, -0.6481213569641113, -0.5978726148605347, -0.5476239323616028, -0.4973752200603485, -0.44712650775909424, -0.39687779545783997, -0.3466290831565857, -0.2963803708553314, -0.24613165855407715, -0.19588294625282288, -0.1456342339515686, -0.09538552165031433, -0.04513680934906006, 0.005111902952194214, 0.055360615253448486, 0.10560932755470276, 0.15585803985595703, 0.2061067521572113, 0.2563554644584656, 0.30660417675971985, 0.3568528890609741, 0.4071016013622284, 0.45735031366348267, 0.5075989961624146, 0.5578477382659912, 0.6080964803695679, 0.6583451628684998, 0.7085938453674316, 0.7588425874710083, 0.809091329574585, 0.8593400120735168, 0.9095886945724487, 0.9598374366760254, 1.010086178779602, 1.0603349208831787, 1.1105835437774658, 1.1608322858810425, 1.2110810279846191, 1.2613296508789062, 1.311578392982483, 1.3618271350860596, 1.4120758771896362, 1.462324619293213, 1.5125732421875, 1.5628219842910767]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 9.0, 5.0, 7.0, 11.0, 9.0, 18.0, 17.0, 34.0, 32.0, 35.0, 43.0, 72.0, 89.0, 105.0, 195.0, 324.0, 639.0, 1497.0, 5714.0, 41968.0, 3572025.0, 540538.0, 24178.0, 4333.0, 1240.0, 532.0, 247.0, 140.0, 80.0, 49.0, 29.0, 20.0, 15.0, 5.0, 7.0, 9.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.71484375, -2.6500091552734375, -2.585174560546875, -2.5203399658203125, -2.45550537109375, -2.3906707763671875, -2.325836181640625, -2.2610015869140625, -2.1961669921875, -2.1313323974609375, -2.066497802734375, -2.0016632080078125, -1.93682861328125, -1.8719940185546875, -1.807159423828125, -1.7423248291015625, -1.677490234375, -1.6126556396484375, -1.547821044921875, -1.4829864501953125, -1.41815185546875, -1.3533172607421875, -1.288482666015625, -1.2236480712890625, -1.1588134765625, -1.0939788818359375, -1.029144287109375, -0.9643096923828125, -0.89947509765625, -0.8346405029296875, -0.769805908203125, -0.7049713134765625, -0.64013671875, -0.5753021240234375, -0.510467529296875, -0.4456329345703125, -0.38079833984375, -0.3159637451171875, -0.251129150390625, -0.1862945556640625, -0.1214599609375, -0.0566253662109375, 0.008209228515625, 0.0730438232421875, 0.13787841796875, 0.2027130126953125, 0.267547607421875, 0.3323822021484375, 0.397216796875, 0.4620513916015625, 0.526885986328125, 0.5917205810546875, 0.65655517578125, 0.7213897705078125, 0.786224365234375, 0.8510589599609375, 0.9158935546875, 0.9807281494140625, 1.045562744140625, 1.1103973388671875, 1.17523193359375, 1.2400665283203125, 1.304901123046875, 1.3697357177734375, 1.4345703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 23.0, 43.0, 58.0, 87.0, 115.0, 145.0, 144.0, 123.0, 90.0, 67.0, 41.0, 26.0, 17.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.240966796875, -0.23606109619140625, -0.2311553955078125, -0.22624969482421875, -0.221343994140625, -0.21643829345703125, -0.2115325927734375, -0.20662689208984375, -0.20172119140625, -0.19681549072265625, -0.1919097900390625, -0.18700408935546875, -0.182098388671875, -0.17719268798828125, -0.1722869873046875, -0.16738128662109375, -0.1624755859375, -0.15756988525390625, -0.1526641845703125, -0.14775848388671875, -0.142852783203125, -0.13794708251953125, -0.1330413818359375, -0.12813568115234375, -0.12322998046875, -0.11832427978515625, -0.1134185791015625, -0.10851287841796875, -0.103607177734375, -0.09870147705078125, -0.0937957763671875, -0.08889007568359375, -0.083984375, -0.07907867431640625, -0.0741729736328125, -0.06926727294921875, -0.064361572265625, -0.05945587158203125, -0.0545501708984375, -0.04964447021484375, -0.04473876953125, -0.03983306884765625, -0.0349273681640625, -0.03002166748046875, -0.025115966796875, -0.02021026611328125, -0.0153045654296875, -0.01039886474609375, -0.0054931640625, -0.00058746337890625, 0.0043182373046875, 0.00922393798828125, 0.014129638671875, 0.01903533935546875, 0.0239410400390625, 0.02884674072265625, 0.03375244140625, 0.03865814208984375, 0.0435638427734375, 0.04846954345703125, 0.053375244140625, 0.05828094482421875, 0.0631866455078125, 0.06809234619140625, 0.072998046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 11.0, 27.0, 44.0, 97.0, 120.0, 255.0, 851.0, 23273.0, 4155876.0, 12668.0, 659.0, 196.0, 102.0, 51.0, 22.0, 15.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.705810546875, -4.55615234375, -4.406494140625, -4.2568359375, -4.107177734375, -3.95751953125, -3.807861328125, -3.658203125, -3.508544921875, -3.35888671875, -3.209228515625, -3.0595703125, -2.909912109375, -2.76025390625, -2.610595703125, -2.4609375, -2.311279296875, -2.16162109375, -2.011962890625, -1.8623046875, -1.712646484375, -1.56298828125, -1.413330078125, -1.263671875, -1.114013671875, -0.96435546875, -0.814697265625, -0.6650390625, -0.515380859375, -0.36572265625, -0.216064453125, -0.06640625, 0.083251953125, 0.23291015625, 0.382568359375, 0.5322265625, 0.681884765625, 0.83154296875, 0.981201171875, 1.130859375, 1.280517578125, 1.43017578125, 1.579833984375, 1.7294921875, 1.879150390625, 2.02880859375, 2.178466796875, 2.328125, 2.477783203125, 2.62744140625, 2.777099609375, 2.9267578125, 3.076416015625, 3.22607421875, 3.375732421875, 3.525390625, 3.675048828125, 3.82470703125, 3.974365234375, 4.1240234375, 4.273681640625, 4.42333984375, 4.572998046875, 4.72265625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 8.0, 18.0, 36.0, 135.0, 434.0, 2560.0, 640.0, 147.0, 67.0, 27.0, 5.0, 2.0, 1.0, 4.0], "bins": [-1.0185546875, -1.0002384185791016, -0.9819221496582031, -0.9636058807373047, -0.9452896118164062, -0.9269733428955078, -0.9086570739746094, -0.8903408050537109, -0.8720245361328125, -0.8537082672119141, -0.8353919982910156, -0.8170757293701172, -0.7987594604492188, -0.7804431915283203, -0.7621269226074219, -0.7438106536865234, -0.725494384765625, -0.7071781158447266, -0.6888618469238281, -0.6705455780029297, -0.6522293090820312, -0.6339130401611328, -0.6155967712402344, -0.5972805023193359, -0.5789642333984375, -0.5606479644775391, -0.5423316955566406, -0.5240154266357422, -0.5056991577148438, -0.4873828887939453, -0.4690666198730469, -0.45075035095214844, -0.43243408203125, -0.41411781311035156, -0.3958015441894531, -0.3774852752685547, -0.35916900634765625, -0.3408527374267578, -0.3225364685058594, -0.30422019958496094, -0.2859039306640625, -0.26758766174316406, -0.24927139282226562, -0.2309551239013672, -0.21263885498046875, -0.1943225860595703, -0.17600631713867188, -0.15769004821777344, -0.139373779296875, -0.12105751037597656, -0.10274124145507812, -0.08442497253417969, -0.06610870361328125, -0.04779243469238281, -0.029476165771484375, -0.011159896850585938, 0.0071563720703125, 0.025472640991210938, 0.043788909912109375, 0.06210517883300781, 0.08042144775390625, 0.09873771667480469, 0.11705398559570312, 0.13537025451660156, 0.1536865234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 9.0, 35.0, 64.0, 108.0, 189.0, 215.0, 159.0, 82.0, 56.0, 22.0, 16.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8358864784240723, -2.7601702213287354, -2.6844539642333984, -2.6087377071380615, -2.5330214500427246, -2.457305431365967, -2.381588935852051, -2.305872917175293, -2.230156660079956, -2.154440402984619, -2.0787241458892822, -2.0030078887939453, -1.927291750907898, -1.851575493812561, -1.7758592367172241, -1.7001430988311768, -1.6244267225265503, -1.5487104654312134, -1.4729942083358765, -1.397278070449829, -1.3215618133544922, -1.2458455562591553, -1.1701292991638184, -1.0944130420684814, -1.0186967849731445, -0.9429805278778076, -0.8672643303871155, -0.7915480732917786, -0.7158318758010864, -0.6401156187057495, -0.5643993616104126, -0.48868316411972046, -0.4129669666290283, -0.3372507393360138, -0.26153451204299927, -0.18581825494766235, -0.11010202765464783, -0.0343858003616333, 0.04133045673370361, 0.11704665422439575, 0.19276291131973267, 0.2684791386127472, 0.3441953659057617, 0.41991162300109863, 0.49562785029411316, 0.5713440775871277, 0.6470603346824646, 0.7227765321731567, 0.7984927892684937, 0.8742090463638306, 0.9499252438545227, 1.0256414413452148, 1.1013576984405518, 1.1770739555358887, 1.2527902126312256, 1.3285064697265625, 1.4042227268218994, 1.4799389839172363, 1.5556552410125732, 1.6313714981079102, 1.7070876359939575, 1.7828038930892944, 1.8585201501846313, 1.9342362880706787, 2.0099525451660156]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 11.0, 9.0, 3.0, 11.0, 21.0, 18.0, 44.0, 46.0, 54.0, 58.0, 74.0, 83.0, 73.0, 73.0, 87.0, 68.0, 67.0, 49.0, 38.0, 31.0, 25.0, 18.0, 20.0, 10.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.430869221687317, -1.3889741897583008, -1.3470792770385742, -1.305184245109558, -1.263289213180542, -1.2213941812515259, -1.1794991493225098, -1.1376042366027832, -1.095709204673767, -1.053814172744751, -1.0119192600250244, -0.9700242280960083, -0.9281291961669922, -0.8862341642379761, -0.8443391919136047, -0.8024442195892334, -0.7605491876602173, -0.7186541557312012, -0.6767591834068298, -0.6348642110824585, -0.5929691791534424, -0.5510741472244263, -0.5091791749000549, -0.4672841727733612, -0.4253891706466675, -0.38349416851997375, -0.34159916639328003, -0.2997041642665863, -0.2578091621398926, -0.21591416001319885, -0.17401915788650513, -0.1321241557598114, -0.09022927284240723, -0.0483342707157135, -0.006439268589019775, 0.03545573353767395, 0.07735073566436768, 0.1192457377910614, 0.16114073991775513, 0.20303574204444885, 0.24493074417114258, 0.2868257462978363, 0.32872074842453003, 0.37061575055122375, 0.4125107526779175, 0.4544057548046112, 0.49630075693130493, 0.5381957292556763, 0.5800907611846924, 0.6219857931137085, 0.6638807654380798, 0.7057757377624512, 0.7476707696914673, 0.7895658016204834, 0.8314607739448547, 0.8733557462692261, 0.9152507781982422, 0.9571458101272583, 0.9990407824516296, 1.040935754776001, 1.082830786705017, 1.1247258186340332, 1.1666207313537598, 1.2085157632827759, 1.250410795211792]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 16.0, 16.0, 25.0, 29.0, 61.0, 92.0, 150.0, 243.0, 459.0, 1071.0, 3452.0, 19132.0, 262649.0, 692292.0, 58431.0, 7126.0, 1778.0, 715.0, 329.0, 179.0, 95.0, 58.0, 37.0, 31.0, 22.0, 11.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9306640625, -1.878814697265625, -1.82696533203125, -1.775115966796875, -1.7232666015625, -1.671417236328125, -1.61956787109375, -1.567718505859375, -1.515869140625, -1.464019775390625, -1.41217041015625, -1.360321044921875, -1.3084716796875, -1.256622314453125, -1.20477294921875, -1.152923583984375, -1.10107421875, -1.049224853515625, -0.99737548828125, -0.945526123046875, -0.8936767578125, -0.841827392578125, -0.78997802734375, -0.738128662109375, -0.686279296875, -0.634429931640625, -0.58258056640625, -0.530731201171875, -0.4788818359375, -0.427032470703125, -0.37518310546875, -0.323333740234375, -0.271484375, -0.219635009765625, -0.16778564453125, -0.115936279296875, -0.0640869140625, -0.012237548828125, 0.03961181640625, 0.091461181640625, 0.143310546875, 0.195159912109375, 0.24700927734375, 0.298858642578125, 0.3507080078125, 0.402557373046875, 0.45440673828125, 0.506256103515625, 0.55810546875, 0.609954833984375, 0.66180419921875, 0.713653564453125, 0.7655029296875, 0.817352294921875, 0.86920166015625, 0.921051025390625, 0.972900390625, 1.024749755859375, 1.07659912109375, 1.128448486328125, 1.1802978515625, 1.232147216796875, 1.28399658203125, 1.335845947265625, 1.3876953125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 20.0, 19.0, 34.0, 64.0, 66.0, 102.0, 111.0, 125.0, 111.0, 109.0, 70.0, 49.0, 44.0, 27.0, 17.0, 10.0, 9.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2457275390625, -0.2404613494873047, -0.23519515991210938, -0.22992897033691406, -0.22466278076171875, -0.21939659118652344, -0.21413040161132812, -0.2088642120361328, -0.2035980224609375, -0.1983318328857422, -0.19306564331054688, -0.18779945373535156, -0.18253326416015625, -0.17726707458496094, -0.17200088500976562, -0.1667346954345703, -0.161468505859375, -0.1562023162841797, -0.15093612670898438, -0.14566993713378906, -0.14040374755859375, -0.13513755798339844, -0.12987136840820312, -0.12460517883300781, -0.1193389892578125, -0.11407279968261719, -0.10880661010742188, -0.10354042053222656, -0.09827423095703125, -0.09300804138183594, -0.08774185180664062, -0.08247566223144531, -0.07720947265625, -0.07194328308105469, -0.06667709350585938, -0.06141090393066406, -0.05614471435546875, -0.05087852478027344, -0.045612335205078125, -0.04034614562988281, -0.0350799560546875, -0.029813766479492188, -0.024547576904296875, -0.019281387329101562, -0.01401519775390625, -0.008749008178710938, -0.003482818603515625, 0.0017833709716796875, 0.007049560546875, 0.012315750122070312, 0.017581939697265625, 0.022848129272460938, 0.02811431884765625, 0.03338050842285156, 0.038646697998046875, 0.04391288757324219, 0.0491790771484375, 0.05444526672363281, 0.059711456298828125, 0.06497764587402344, 0.07024383544921875, 0.07551002502441406, 0.08077621459960938, 0.08604240417480469, 0.09130859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 16.0, 21.0, 37.0, 45.0, 59.0, 87.0, 185.0, 310.0, 554.0, 1219.0, 2695.0, 7270.0, 33650.0, 334587.0, 584753.0, 65189.0, 11146.0, 3501.0, 1508.0, 734.0, 391.0, 189.0, 142.0, 57.0, 46.0, 33.0, 22.0, 17.0, 12.0, 7.0, 7.0, 6.0, 4.0, 7.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0810546875, -1.0452117919921875, -1.009368896484375, -0.9735260009765625, -0.93768310546875, -0.9018402099609375, -0.865997314453125, -0.8301544189453125, -0.7943115234375, -0.7584686279296875, -0.722625732421875, -0.6867828369140625, -0.65093994140625, -0.6150970458984375, -0.579254150390625, -0.5434112548828125, -0.507568359375, -0.4717254638671875, -0.435882568359375, -0.4000396728515625, -0.36419677734375, -0.3283538818359375, -0.292510986328125, -0.2566680908203125, -0.2208251953125, -0.1849822998046875, -0.149139404296875, -0.1132965087890625, -0.07745361328125, -0.0416107177734375, -0.005767822265625, 0.0300750732421875, 0.06591796875, 0.1017608642578125, 0.137603759765625, 0.1734466552734375, 0.20928955078125, 0.2451324462890625, 0.280975341796875, 0.3168182373046875, 0.3526611328125, 0.3885040283203125, 0.424346923828125, 0.4601898193359375, 0.49603271484375, 0.5318756103515625, 0.567718505859375, 0.6035614013671875, 0.639404296875, 0.6752471923828125, 0.711090087890625, 0.7469329833984375, 0.78277587890625, 0.8186187744140625, 0.854461669921875, 0.8903045654296875, 0.9261474609375, 0.9619903564453125, 0.997833251953125, 1.0336761474609375, 1.06951904296875, 1.1053619384765625, 1.141204833984375, 1.1770477294921875, 1.212890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 4.0, 9.0, 12.0, 16.0, 25.0, 33.0, 47.0, 38.0, 52.0, 60.0, 71.0, 64.0, 87.0, 71.0, 72.0, 48.0, 73.0, 49.0, 40.0, 34.0, 16.0, 18.0, 17.0, 11.0, 8.0, 9.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.63818359375, -0.62091064453125, -0.6036376953125, -0.58636474609375, -0.569091796875, -0.55181884765625, -0.5345458984375, -0.51727294921875, -0.5, -0.48272705078125, -0.4654541015625, -0.44818115234375, -0.430908203125, -0.41363525390625, -0.3963623046875, -0.37908935546875, -0.36181640625, -0.34454345703125, -0.3272705078125, -0.30999755859375, -0.292724609375, -0.27545166015625, -0.2581787109375, -0.24090576171875, -0.2236328125, -0.20635986328125, -0.1890869140625, -0.17181396484375, -0.154541015625, -0.13726806640625, -0.1199951171875, -0.10272216796875, -0.08544921875, -0.06817626953125, -0.0509033203125, -0.03363037109375, -0.016357421875, 0.00091552734375, 0.0181884765625, 0.03546142578125, 0.052734375, 0.07000732421875, 0.0872802734375, 0.10455322265625, 0.121826171875, 0.13909912109375, 0.1563720703125, 0.17364501953125, 0.19091796875, 0.20819091796875, 0.2254638671875, 0.24273681640625, 0.260009765625, 0.27728271484375, 0.2945556640625, 0.31182861328125, 0.3291015625, 0.34637451171875, 0.3636474609375, 0.38092041015625, 0.398193359375, 0.41546630859375, 0.4327392578125, 0.45001220703125, 0.46728515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 27.0, 31.0, 56.0, 91.0, 190.0, 454.0, 1105.0, 3388.0, 17654.0, 260446.0, 702641.0, 52721.0, 6663.0, 1791.0, 670.0, 279.0, 149.0, 73.0, 37.0, 31.0, 20.0, 3.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.818359375, -0.7963790893554688, -0.7743988037109375, -0.7524185180664062, -0.730438232421875, -0.7084579467773438, -0.6864776611328125, -0.6644973754882812, -0.64251708984375, -0.6205368041992188, -0.5985565185546875, -0.5765762329101562, -0.554595947265625, -0.5326156616210938, -0.5106353759765625, -0.48865509033203125, -0.4666748046875, -0.44469451904296875, -0.4227142333984375, -0.40073394775390625, -0.378753662109375, -0.35677337646484375, -0.3347930908203125, -0.31281280517578125, -0.29083251953125, -0.26885223388671875, -0.2468719482421875, -0.22489166259765625, -0.202911376953125, -0.18093109130859375, -0.1589508056640625, -0.13697052001953125, -0.114990234375, -0.09300994873046875, -0.0710296630859375, -0.04904937744140625, -0.027069091796875, -0.00508880615234375, 0.0168914794921875, 0.03887176513671875, 0.06085205078125, 0.08283233642578125, 0.1048126220703125, 0.12679290771484375, 0.148773193359375, 0.17075347900390625, 0.1927337646484375, 0.21471405029296875, 0.2366943359375, 0.25867462158203125, 0.2806549072265625, 0.30263519287109375, 0.324615478515625, 0.34659576416015625, 0.3685760498046875, 0.39055633544921875, 0.41253662109375, 0.43451690673828125, 0.4564971923828125, 0.47847747802734375, 0.500457763671875, 0.5224380493164062, 0.5444183349609375, 0.5663986206054688, 0.58837890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 8.0, 7.0, 6.0, 15.0, 14.0, 20.0, 20.0, 30.0, 48.0, 60.0, 67.0, 87.0, 96.0, 106.0, 96.0, 67.0, 68.0, 43.0, 30.0, 25.0, 21.0, 25.0, 7.0, 8.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00011032819747924805, -0.00010719709098339081, -0.00010406598448753357, -0.00010093487799167633, -9.780377149581909e-05, -9.467266499996185e-05, -9.154155850410461e-05, -8.841045200824738e-05, -8.527934551239014e-05, -8.21482390165329e-05, -7.901713252067566e-05, -7.588602602481842e-05, -7.275491952896118e-05, -6.962381303310394e-05, -6.64927065372467e-05, -6.336160004138947e-05, -6.0230493545532227e-05, -5.709938704967499e-05, -5.396828055381775e-05, -5.083717405796051e-05, -4.770606756210327e-05, -4.457496106624603e-05, -4.1443854570388794e-05, -3.8312748074531555e-05, -3.5181641578674316e-05, -3.205053508281708e-05, -2.891942858695984e-05, -2.57883220911026e-05, -2.265721559524536e-05, -1.9526109099388123e-05, -1.6395002603530884e-05, -1.3263896107673645e-05, -1.0132789611816406e-05, -7.0016831159591675e-06, -3.870576620101929e-06, -7.394701242446899e-07, 2.391636371612549e-06, 5.522742867469788e-06, 8.653849363327026e-06, 1.1784955859184265e-05, 1.4916062355041504e-05, 1.8047168850898743e-05, 2.117827534675598e-05, 2.430938184261322e-05, 2.744048833847046e-05, 3.05715948343277e-05, 3.3702701330184937e-05, 3.6833807826042175e-05, 3.9964914321899414e-05, 4.309602081775665e-05, 4.622712731361389e-05, 4.935823380947113e-05, 5.248934030532837e-05, 5.562044680118561e-05, 5.875155329704285e-05, 6.188265979290009e-05, 6.501376628875732e-05, 6.814487278461456e-05, 7.12759792804718e-05, 7.440708577632904e-05, 7.753819227218628e-05, 8.066929876804352e-05, 8.380040526390076e-05, 8.6931511759758e-05, 9.006261825561523e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 13.0, 19.0, 26.0, 49.0, 100.0, 176.0, 460.0, 1316.0, 5657.0, 71942.0, 896783.0, 64539.0, 5358.0, 1273.0, 427.0, 186.0, 85.0, 60.0, 26.0, 16.0, 20.0, 10.0, 3.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69287109375, -0.6633682250976562, -0.6338653564453125, -0.6043624877929688, -0.574859619140625, -0.5453567504882812, -0.5158538818359375, -0.48635101318359375, -0.45684814453125, -0.42734527587890625, -0.3978424072265625, -0.36833953857421875, -0.338836669921875, -0.30933380126953125, -0.2798309326171875, -0.25032806396484375, -0.2208251953125, -0.19132232666015625, -0.1618194580078125, -0.13231658935546875, -0.102813720703125, -0.07331085205078125, -0.0438079833984375, -0.01430511474609375, 0.01519775390625, 0.04470062255859375, 0.0742034912109375, 0.10370635986328125, 0.133209228515625, 0.16271209716796875, 0.1922149658203125, 0.22171783447265625, 0.251220703125, 0.28072357177734375, 0.3102264404296875, 0.33972930908203125, 0.369232177734375, 0.39873504638671875, 0.4282379150390625, 0.45774078369140625, 0.48724365234375, 0.5167465209960938, 0.5462493896484375, 0.5757522583007812, 0.605255126953125, 0.6347579956054688, 0.6642608642578125, 0.6937637329101562, 0.7232666015625, 0.7527694702148438, 0.7822723388671875, 0.8117752075195312, 0.841278076171875, 0.8707809448242188, 0.9002838134765625, 0.9297866821289062, 0.95928955078125, 0.9887924194335938, 1.0182952880859375, 1.0477981567382812, 1.077301025390625, 1.1068038940429688, 1.1363067626953125, 1.1658096313476562, 1.1953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 17.0, 31.0, 32.0, 36.0, 77.0, 108.0, 114.0, 134.0, 120.0, 97.0, 77.0, 50.0, 23.0, 24.0, 21.0, 9.0, 6.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29296875, -0.28058624267578125, -0.2682037353515625, -0.25582122802734375, -0.243438720703125, -0.23105621337890625, -0.2186737060546875, -0.20629119873046875, -0.19390869140625, -0.18152618408203125, -0.1691436767578125, -0.15676116943359375, -0.144378662109375, -0.13199615478515625, -0.1196136474609375, -0.10723114013671875, -0.0948486328125, -0.08246612548828125, -0.0700836181640625, -0.05770111083984375, -0.045318603515625, -0.03293609619140625, -0.0205535888671875, -0.00817108154296875, 0.00421142578125, 0.01659393310546875, 0.0289764404296875, 0.04135894775390625, 0.053741455078125, 0.06612396240234375, 0.0785064697265625, 0.09088897705078125, 0.103271484375, 0.11565399169921875, 0.1280364990234375, 0.14041900634765625, 0.152801513671875, 0.16518402099609375, 0.1775665283203125, 0.18994903564453125, 0.20233154296875, 0.21471405029296875, 0.2270965576171875, 0.23947906494140625, 0.251861572265625, 0.26424407958984375, 0.2766265869140625, 0.28900909423828125, 0.3013916015625, 0.31377410888671875, 0.3261566162109375, 0.33853912353515625, 0.350921630859375, 0.36330413818359375, 0.3756866455078125, 0.38806915283203125, 0.40045166015625, 0.41283416748046875, 0.4252166748046875, 0.43759918212890625, 0.449981689453125, 0.46236419677734375, 0.4747467041015625, 0.48712921142578125, 0.49951171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 18.0, 47.0, 64.0, 118.0, 173.0, 214.0, 174.0, 87.0, 49.0, 22.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.256625175476074, -6.062235355377197, -5.86784553527832, -5.673455238342285, -5.479065418243408, -5.284675598144531, -5.090285778045654, -4.895895957946777, -4.701505661010742, -4.507115840911865, -4.312726020812988, -4.118335723876953, -3.923945903778076, -3.729556083679199, -3.5351662635803223, -3.3407764434814453, -3.1463866233825684, -2.9519968032836914, -2.7576067447662354, -2.5632169246673584, -2.3688268661499023, -2.1744370460510254, -1.9800472259521484, -1.785657286643982, -1.5912673473358154, -1.396877408027649, -1.2024874687194824, -1.0080976486206055, -0.813707709312439, -0.6193177700042725, -0.4249279499053955, -0.230538010597229, -0.0361475944519043, 0.15824231505393982, 0.35263222455978394, 0.5470221042633057, 0.7414120435714722, 0.9358019828796387, 1.1301918029785156, 1.3245817422866821, 1.5189716815948486, 1.7133616209030151, 1.9077515602111816, 2.1021413803100586, 2.2965312004089355, 2.4909212589263916, 2.6853110790252686, 2.8797011375427246, 3.0740909576416016, 3.2684807777404785, 3.4628708362579346, 3.6572606563568115, 3.8516507148742676, 4.0460405349731445, 4.2404303550720215, 4.434820175170898, 4.629210472106934, 4.8236002922058105, 5.0179901123046875, 5.212380409240723, 5.4067702293396, 5.601160049438477, 5.7955498695373535, 5.9899396896362305, 6.184329509735107]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 7.0, 3.0, 9.0, 12.0, 17.0, 10.0, 18.0, 30.0, 41.0, 39.0, 55.0, 57.0, 42.0, 75.0, 72.0, 72.0, 74.0, 69.0, 54.0, 38.0, 38.0, 42.0, 33.0, 26.0, 19.0, 12.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0189208984375, -3.9207749366760254, -3.82262921333313, -3.7244832515716553, -3.6263375282287598, -3.528191566467285, -3.4300458431243896, -3.331899881362915, -3.2337541580200195, -3.135608196258545, -3.0374624729156494, -2.939316511154175, -2.8411707878112793, -2.7430248260498047, -2.644879102706909, -2.5467331409454346, -2.448587417602539, -2.3504414558410645, -2.252295732498169, -2.1541497707366943, -2.056004047393799, -1.9578582048416138, -1.8597123622894287, -1.761566400527954, -1.6634204387664795, -1.5652745962142944, -1.4671287536621094, -1.3689829111099243, -1.2708370685577393, -1.1726912260055542, -1.0745453834533691, -0.9763994812965393, -0.878253698348999, -0.780107855796814, -0.6819620132446289, -0.5838161706924438, -0.4856702983379364, -0.38752445578575134, -0.2893785834312439, -0.19123274087905884, -0.09308689832687378, 0.005058951675891876, 0.10320480167865753, 0.20135065913200378, 0.29949650168418884, 0.3976423442363739, 0.49578821659088135, 0.5939340591430664, 0.6920799016952515, 0.7902257442474365, 0.8883715867996216, 0.9865174293518066, 1.0846632719039917, 1.1828091144561768, 1.2809550762176514, 1.3791007995605469, 1.4772467613220215, 1.5753926038742065, 1.6735384464263916, 1.7716842889785767, 1.8698301315307617, 1.9679759740829468, 2.066121816635132, 2.1642677783966064, 2.262413501739502]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 13.0, 11.0, 26.0, 33.0, 40.0, 45.0, 75.0, 111.0, 123.0, 204.0, 292.0, 456.0, 1123.0, 3066.0, 15026.0, 175363.0, 3830082.0, 149012.0, 14101.0, 3065.0, 1079.0, 449.0, 201.0, 95.0, 73.0, 38.0, 18.0, 19.0, 10.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.59765625, -2.5318450927734375, -2.466033935546875, -2.4002227783203125, -2.33441162109375, -2.2686004638671875, -2.202789306640625, -2.1369781494140625, -2.0711669921875, -2.0053558349609375, -1.939544677734375, -1.8737335205078125, -1.80792236328125, -1.7421112060546875, -1.676300048828125, -1.6104888916015625, -1.544677734375, -1.4788665771484375, -1.413055419921875, -1.3472442626953125, -1.28143310546875, -1.2156219482421875, -1.149810791015625, -1.0839996337890625, -1.0181884765625, -0.9523773193359375, -0.886566162109375, -0.8207550048828125, -0.75494384765625, -0.6891326904296875, -0.623321533203125, -0.5575103759765625, -0.49169921875, -0.4258880615234375, -0.360076904296875, -0.2942657470703125, -0.22845458984375, -0.1626434326171875, -0.096832275390625, -0.0310211181640625, 0.0347900390625, 0.1006011962890625, 0.166412353515625, 0.2322235107421875, 0.29803466796875, 0.3638458251953125, 0.429656982421875, 0.4954681396484375, 0.561279296875, 0.6270904541015625, 0.692901611328125, 0.7587127685546875, 0.82452392578125, 0.8903350830078125, 0.956146240234375, 1.0219573974609375, 1.0877685546875, 1.1535797119140625, 1.219390869140625, 1.2852020263671875, 1.35101318359375, 1.4168243408203125, 1.482635498046875, 1.5484466552734375, 1.6142578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 15.0, 17.0, 25.0, 49.0, 61.0, 78.0, 99.0, 116.0, 123.0, 103.0, 82.0, 71.0, 56.0, 33.0, 24.0, 15.0, 8.0, 9.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.237060546875, -0.23192787170410156, -0.22679519653320312, -0.2216625213623047, -0.21652984619140625, -0.2113971710205078, -0.20626449584960938, -0.20113182067871094, -0.1959991455078125, -0.19086647033691406, -0.18573379516601562, -0.1806011199951172, -0.17546844482421875, -0.1703357696533203, -0.16520309448242188, -0.16007041931152344, -0.154937744140625, -0.14980506896972656, -0.14467239379882812, -0.1395397186279297, -0.13440704345703125, -0.1292743682861328, -0.12414169311523438, -0.11900901794433594, -0.1138763427734375, -0.10874366760253906, -0.10361099243164062, -0.09847831726074219, -0.09334564208984375, -0.08821296691894531, -0.08308029174804688, -0.07794761657714844, -0.07281494140625, -0.06768226623535156, -0.06254959106445312, -0.05741691589355469, -0.05228424072265625, -0.04715156555175781, -0.042018890380859375, -0.03688621520996094, -0.0317535400390625, -0.026620864868164062, -0.021488189697265625, -0.016355514526367188, -0.01122283935546875, -0.0060901641845703125, -0.000957489013671875, 0.0041751861572265625, 0.009307861328125, 0.014440536499023438, 0.019573211669921875, 0.024705886840820312, 0.02983856201171875, 0.03497123718261719, 0.040103912353515625, 0.04523658752441406, 0.0503692626953125, 0.05550193786621094, 0.060634613037109375, 0.06576728820800781, 0.07089996337890625, 0.07603263854980469, 0.08116531372070312, 0.08629798889160156, 0.0914306640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 3.0, 11.0, 18.0, 16.0, 25.0, 37.0, 40.0, 57.0, 116.0, 225.0, 652.0, 2064.0, 9118.0, 409306.0, 3754673.0, 13925.0, 2632.0, 716.0, 275.0, 127.0, 72.0, 54.0, 31.0, 31.0, 14.0, 16.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -4.137939453125, -3.99072265625, -3.843505859375, -3.6962890625, -3.549072265625, -3.40185546875, -3.254638671875, -3.107421875, -2.960205078125, -2.81298828125, -2.665771484375, -2.5185546875, -2.371337890625, -2.22412109375, -2.076904296875, -1.9296875, -1.782470703125, -1.63525390625, -1.488037109375, -1.3408203125, -1.193603515625, -1.04638671875, -0.899169921875, -0.751953125, -0.604736328125, -0.45751953125, -0.310302734375, -0.1630859375, -0.015869140625, 0.13134765625, 0.278564453125, 0.42578125, 0.572998046875, 0.72021484375, 0.867431640625, 1.0146484375, 1.161865234375, 1.30908203125, 1.456298828125, 1.603515625, 1.750732421875, 1.89794921875, 2.045166015625, 2.1923828125, 2.339599609375, 2.48681640625, 2.634033203125, 2.78125, 2.928466796875, 3.07568359375, 3.222900390625, 3.3701171875, 3.517333984375, 3.66455078125, 3.811767578125, 3.958984375, 4.106201171875, 4.25341796875, 4.400634765625, 4.5478515625, 4.695068359375, 4.84228515625, 4.989501953125, 5.13671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 10.0, 16.0, 23.0, 35.0, 98.0, 247.0, 761.0, 1922.0, 576.0, 197.0, 81.0, 32.0, 29.0, 7.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.0048828125, -0.9827499389648438, -0.9606170654296875, -0.9384841918945312, -0.916351318359375, -0.8942184448242188, -0.8720855712890625, -0.8499526977539062, -0.82781982421875, -0.8056869506835938, -0.7835540771484375, -0.7614212036132812, -0.739288330078125, -0.7171554565429688, -0.6950225830078125, -0.6728897094726562, -0.6507568359375, -0.6286239624023438, -0.6064910888671875, -0.5843582153320312, -0.562225341796875, -0.5400924682617188, -0.5179595947265625, -0.49582672119140625, -0.47369384765625, -0.45156097412109375, -0.4294281005859375, -0.40729522705078125, -0.385162353515625, -0.36302947998046875, -0.3408966064453125, -0.31876373291015625, -0.296630859375, -0.27449798583984375, -0.2523651123046875, -0.23023223876953125, -0.208099365234375, -0.18596649169921875, -0.1638336181640625, -0.14170074462890625, -0.11956787109375, -0.09743499755859375, -0.0753021240234375, -0.05316925048828125, -0.031036376953125, -0.00890350341796875, 0.0132293701171875, 0.03536224365234375, 0.0574951171875, 0.07962799072265625, 0.1017608642578125, 0.12389373779296875, 0.146026611328125, 0.16815948486328125, 0.1902923583984375, 0.21242523193359375, 0.23455810546875, 0.25669097900390625, 0.2788238525390625, 0.30095672607421875, 0.323089599609375, 0.34522247314453125, 0.3673553466796875, 0.38948822021484375, 0.41162109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 17.0, 23.0, 82.0, 192.0, 264.0, 209.0, 120.0, 45.0, 19.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.52221965789795, -9.303872108459473, -9.085525512695312, -8.867177963256836, -8.648831367492676, -8.4304838180542, -8.212137222290039, -7.9937896728515625, -7.775442600250244, -7.557095527648926, -7.338748455047607, -7.120401382446289, -6.9020538330078125, -6.683706760406494, -6.465359687805176, -6.247012615203857, -6.028665542602539, -5.810318470001221, -5.591971397399902, -5.373623847961426, -5.155276775360107, -4.936929702758789, -4.718582630157471, -4.500235557556152, -4.281888008117676, -4.063540935516357, -3.84519362449646, -3.6268465518951416, -3.4084994792938232, -3.190152168273926, -2.9718050956726074, -2.753458023071289, -2.5351109504699707, -2.3167638778686523, -2.098416566848755, -1.8800694942474365, -1.6617224216461182, -1.4433752298355103, -1.2250280380249023, -1.006680965423584, -0.7883337736129761, -0.5699866414070129, -0.3516394793987274, -0.1332923173904419, 0.08505481481552124, 0.3034019470214844, 0.5217491388320923, 0.7400962114334106, 0.9584434032440186, 1.1767905950546265, 1.3951376676559448, 1.6134848594665527, 1.831831932067871, 2.0501790046691895, 2.268526315689087, 2.4868733882904053, 2.7052206993103027, 2.923567771911621, 3.1419150829315186, 3.360262155532837, 3.5786092281341553, 3.7969565391540527, 4.015303611755371, 4.2336506843566895, 4.451997756958008]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 15.0, 20.0, 32.0, 45.0, 48.0, 60.0, 73.0, 87.0, 84.0, 75.0, 102.0, 75.0, 65.0, 65.0, 45.0, 20.0, 24.0, 19.0, 7.0, 10.0, 10.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4079484939575195, -2.3296139240264893, -2.251279354095459, -2.1729447841644287, -2.0946102142333984, -2.016275644302368, -1.937941074371338, -1.8596065044403076, -1.7812719345092773, -1.702937364578247, -1.6246027946472168, -1.5462682247161865, -1.4679336547851562, -1.389599084854126, -1.3112645149230957, -1.2329299449920654, -1.1545952558517456, -1.0762606859207153, -0.9979261159896851, -0.9195915460586548, -0.8412569761276245, -0.7629224061965942, -0.6845877766609192, -0.6062532067298889, -0.5279186367988586, -0.44958406686782837, -0.3712494969367981, -0.29291489720344543, -0.21458032727241516, -0.1362457573413849, -0.05791115760803223, 0.020423412322998047, 0.09875798225402832, 0.1770925521850586, 0.25542712211608887, 0.33376172184944153, 0.4120962917804718, 0.4904308617115021, 0.5687654614448547, 0.647100031375885, 0.7254346013069153, 0.8037691712379456, 0.8821037411689758, 0.9604383707046509, 1.0387729406356812, 1.1171075105667114, 1.1954420804977417, 1.273776650428772, 1.3521112203598022, 1.4304457902908325, 1.5087803602218628, 1.587114930152893, 1.6654495000839233, 1.7437840700149536, 1.8221187591552734, 1.9004533290863037, 1.978787899017334, 2.0571224689483643, 2.1354570388793945, 2.213791608810425, 2.292126178741455, 2.3704607486724854, 2.4487953186035156, 2.527129888534546, 2.605464458465576]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 12.0, 16.0, 11.0, 15.0, 31.0, 33.0, 54.0, 83.0, 104.0, 146.0, 225.0, 329.0, 581.0, 1036.0, 2288.0, 8143.0, 49820.0, 496934.0, 434351.0, 42488.0, 7073.0, 2126.0, 1004.0, 531.0, 344.0, 208.0, 146.0, 100.0, 91.0, 48.0, 39.0, 30.0, 21.0, 28.0, 15.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.37890625, -1.3328857421875, -1.286865234375, -1.2408447265625, -1.19482421875, -1.1488037109375, -1.102783203125, -1.0567626953125, -1.0107421875, -0.9647216796875, -0.918701171875, -0.8726806640625, -0.82666015625, -0.7806396484375, -0.734619140625, -0.6885986328125, -0.642578125, -0.5965576171875, -0.550537109375, -0.5045166015625, -0.45849609375, -0.4124755859375, -0.366455078125, -0.3204345703125, -0.2744140625, -0.2283935546875, -0.182373046875, -0.1363525390625, -0.09033203125, -0.0443115234375, 0.001708984375, 0.0477294921875, 0.09375, 0.1397705078125, 0.185791015625, 0.2318115234375, 0.27783203125, 0.3238525390625, 0.369873046875, 0.4158935546875, 0.4619140625, 0.5079345703125, 0.553955078125, 0.5999755859375, 0.64599609375, 0.6920166015625, 0.738037109375, 0.7840576171875, 0.830078125, 0.8760986328125, 0.922119140625, 0.9681396484375, 1.01416015625, 1.0601806640625, 1.106201171875, 1.1522216796875, 1.1982421875, 1.2442626953125, 1.290283203125, 1.3363037109375, 1.38232421875, 1.4283447265625, 1.474365234375, 1.5203857421875, 1.56640625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 13.0, 31.0, 52.0, 66.0, 96.0, 110.0, 132.0, 129.0, 126.0, 71.0, 69.0, 32.0, 22.0, 15.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.284912109375, -0.27809715270996094, -0.2712821960449219, -0.2644672393798828, -0.25765228271484375, -0.2508373260498047, -0.24402236938476562, -0.23720741271972656, -0.2303924560546875, -0.22357749938964844, -0.21676254272460938, -0.2099475860595703, -0.20313262939453125, -0.1963176727294922, -0.18950271606445312, -0.18268775939941406, -0.175872802734375, -0.16905784606933594, -0.16224288940429688, -0.1554279327392578, -0.14861297607421875, -0.1417980194091797, -0.13498306274414062, -0.12816810607910156, -0.1213531494140625, -0.11453819274902344, -0.10772323608398438, -0.10090827941894531, -0.09409332275390625, -0.08727836608886719, -0.08046340942382812, -0.07364845275878906, -0.06683349609375, -0.06001853942871094, -0.053203582763671875, -0.04638862609863281, -0.03957366943359375, -0.03275871276855469, -0.025943756103515625, -0.019128799438476562, -0.0123138427734375, -0.0054988861083984375, 0.001316070556640625, 0.008131027221679688, 0.01494598388671875, 0.021760940551757812, 0.028575897216796875, 0.03539085388183594, 0.042205810546875, 0.04902076721191406, 0.055835723876953125, 0.06265068054199219, 0.06946563720703125, 0.07628059387207031, 0.08309555053710938, 0.08991050720214844, 0.0967254638671875, 0.10354042053222656, 0.11035537719726562, 0.11717033386230469, 0.12398529052734375, 0.1308002471923828, 0.13761520385742188, 0.14443016052246094, 0.1512451171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 12.0, 8.0, 10.0, 17.0, 26.0, 55.0, 49.0, 79.0, 131.0, 206.0, 282.0, 527.0, 1090.0, 2384.0, 6030.0, 18975.0, 67774.0, 230811.0, 417944.0, 213078.0, 61514.0, 17313.0, 5682.0, 2170.0, 970.0, 504.0, 302.0, 189.0, 111.0, 106.0, 67.0, 38.0, 28.0, 21.0, 18.0, 9.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.524200439453125, -0.50640869140625, -0.488616943359375, -0.4708251953125, -0.453033447265625, -0.43524169921875, -0.417449951171875, -0.399658203125, -0.381866455078125, -0.36407470703125, -0.346282958984375, -0.3284912109375, -0.310699462890625, -0.29290771484375, -0.275115966796875, -0.25732421875, -0.239532470703125, -0.22174072265625, -0.203948974609375, -0.1861572265625, -0.168365478515625, -0.15057373046875, -0.132781982421875, -0.114990234375, -0.097198486328125, -0.07940673828125, -0.061614990234375, -0.0438232421875, -0.026031494140625, -0.00823974609375, 0.009552001953125, 0.02734375, 0.045135498046875, 0.06292724609375, 0.080718994140625, 0.0985107421875, 0.116302490234375, 0.13409423828125, 0.151885986328125, 0.169677734375, 0.187469482421875, 0.20526123046875, 0.223052978515625, 0.2408447265625, 0.258636474609375, 0.27642822265625, 0.294219970703125, 0.31201171875, 0.329803466796875, 0.34759521484375, 0.365386962890625, 0.3831787109375, 0.400970458984375, 0.41876220703125, 0.436553955078125, 0.454345703125, 0.472137451171875, 0.48992919921875, 0.507720947265625, 0.5255126953125, 0.543304443359375, 0.56109619140625, 0.578887939453125, 0.5966796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 8.0, 7.0, 5.0, 6.0, 15.0, 11.0, 16.0, 20.0, 16.0, 19.0, 22.0, 21.0, 34.0, 34.0, 43.0, 34.0, 44.0, 56.0, 48.0, 49.0, 42.0, 44.0, 43.0, 46.0, 47.0, 41.0, 23.0, 36.0, 24.0, 39.0, 12.0, 22.0, 10.0, 8.0, 19.0, 6.0, 11.0, 5.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.375, -0.36243438720703125, -0.3498687744140625, -0.33730316162109375, -0.324737548828125, -0.31217193603515625, -0.2996063232421875, -0.28704071044921875, -0.27447509765625, -0.26190948486328125, -0.2493438720703125, -0.23677825927734375, -0.224212646484375, -0.21164703369140625, -0.1990814208984375, -0.18651580810546875, -0.1739501953125, -0.16138458251953125, -0.1488189697265625, -0.13625335693359375, -0.123687744140625, -0.11112213134765625, -0.0985565185546875, -0.08599090576171875, -0.07342529296875, -0.06085968017578125, -0.0482940673828125, -0.03572845458984375, -0.023162841796875, -0.01059722900390625, 0.0019683837890625, 0.01453399658203125, 0.027099609375, 0.03966522216796875, 0.0522308349609375, 0.06479644775390625, 0.077362060546875, 0.08992767333984375, 0.1024932861328125, 0.11505889892578125, 0.12762451171875, 0.14019012451171875, 0.1527557373046875, 0.16532135009765625, 0.177886962890625, 0.19045257568359375, 0.2030181884765625, 0.21558380126953125, 0.2281494140625, 0.24071502685546875, 0.2532806396484375, 0.26584625244140625, 0.278411865234375, 0.29097747802734375, 0.3035430908203125, 0.31610870361328125, 0.32867431640625, 0.34123992919921875, 0.3538055419921875, 0.36637115478515625, 0.378936767578125, 0.39150238037109375, 0.4040679931640625, 0.41663360595703125, 0.42919921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 8.0, 8.0, 11.0, 22.0, 20.0, 32.0, 40.0, 89.0, 137.0, 189.0, 367.0, 689.0, 1485.0, 3825.0, 12736.0, 53562.0, 243581.0, 473372.0, 199019.0, 42895.0, 10389.0, 3252.0, 1288.0, 654.0, 300.0, 200.0, 119.0, 77.0, 52.0, 38.0, 26.0, 15.0, 15.0, 14.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332763671875, -0.3218269348144531, -0.31089019775390625, -0.2999534606933594, -0.2890167236328125, -0.2780799865722656, -0.26714324951171875, -0.2562065124511719, -0.245269775390625, -0.23433303833007812, -0.22339630126953125, -0.21245956420898438, -0.2015228271484375, -0.19058609008789062, -0.17964935302734375, -0.16871261596679688, -0.15777587890625, -0.14683914184570312, -0.13590240478515625, -0.12496566772460938, -0.1140289306640625, -0.10309219360351562, -0.09215545654296875, -0.08121871948242188, -0.070281982421875, -0.059345245361328125, -0.04840850830078125, -0.037471771240234375, -0.0265350341796875, -0.015598297119140625, -0.00466156005859375, 0.006275177001953125, 0.0172119140625, 0.028148651123046875, 0.03908538818359375, 0.050022125244140625, 0.0609588623046875, 0.07189559936523438, 0.08283233642578125, 0.09376907348632812, 0.104705810546875, 0.11564254760742188, 0.12657928466796875, 0.13751602172851562, 0.1484527587890625, 0.15938949584960938, 0.17032623291015625, 0.18126296997070312, 0.19219970703125, 0.20313644409179688, 0.21407318115234375, 0.22500991821289062, 0.2359466552734375, 0.24688339233398438, 0.25782012939453125, 0.2687568664550781, 0.279693603515625, 0.2906303405761719, 0.30156707763671875, 0.3125038146972656, 0.3234405517578125, 0.3343772888183594, 0.34531402587890625, 0.3562507629394531, 0.3671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 12.0, 13.0, 15.0, 15.0, 30.0, 52.0, 38.0, 72.0, 91.0, 91.0, 97.0, 87.0, 92.0, 85.0, 59.0, 40.0, 35.0, 18.0, 18.0, 13.0, 11.0, 5.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001112222671508789, -0.00010801013559103012, -0.00010479800403118134, -0.00010158587247133255, -9.837374091148376e-05, -9.516160935163498e-05, -9.19494777917862e-05, -8.873734623193741e-05, -8.552521467208862e-05, -8.231308311223984e-05, -7.910095155239105e-05, -7.588881999254227e-05, -7.267668843269348e-05, -6.94645568728447e-05, -6.625242531299591e-05, -6.304029375314713e-05, -5.982816219329834e-05, -5.6616030633449554e-05, -5.340389907360077e-05, -5.0191767513751984e-05, -4.69796359539032e-05, -4.376750439405441e-05, -4.055537283420563e-05, -3.734324127435684e-05, -3.413110971450806e-05, -3.091897815465927e-05, -2.7706846594810486e-05, -2.44947150349617e-05, -2.1282583475112915e-05, -1.807045191526413e-05, -1.4858320355415344e-05, -1.1646188795566559e-05, -8.434057235717773e-06, -5.221925675868988e-06, -2.0097941160202026e-06, 1.2023374438285828e-06, 4.414469003677368e-06, 7.6266005635261536e-06, 1.0838732123374939e-05, 1.4050863683223724e-05, 1.726299524307251e-05, 2.0475126802921295e-05, 2.368725836277008e-05, 2.6899389922618866e-05, 3.011152148246765e-05, 3.332365304231644e-05, 3.653578460216522e-05, 3.974791616201401e-05, 4.296004772186279e-05, 4.617217928171158e-05, 4.9384310841560364e-05, 5.259644240140915e-05, 5.5808573961257935e-05, 5.902070552110672e-05, 6.22328370809555e-05, 6.544496864080429e-05, 6.865710020065308e-05, 7.186923176050186e-05, 7.508136332035065e-05, 7.829349488019943e-05, 8.150562644004822e-05, 8.4717757999897e-05, 8.792988955974579e-05, 9.114202111959457e-05, 9.435415267944336e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 11.0, 28.0, 34.0, 53.0, 79.0, 172.0, 397.0, 1009.0, 3482.0, 21691.0, 311556.0, 637844.0, 62870.0, 6701.0, 1582.0, 561.0, 218.0, 123.0, 72.0, 32.0, 13.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.79931640625, -0.7799186706542969, -0.7605209350585938, -0.7411231994628906, -0.7217254638671875, -0.7023277282714844, -0.6829299926757812, -0.6635322570800781, -0.644134521484375, -0.6247367858886719, -0.6053390502929688, -0.5859413146972656, -0.5665435791015625, -0.5471458435058594, -0.5277481079101562, -0.5083503723144531, -0.48895263671875, -0.4695549011230469, -0.45015716552734375, -0.4307594299316406, -0.4113616943359375, -0.3919639587402344, -0.37256622314453125, -0.3531684875488281, -0.333770751953125, -0.3143730163574219, -0.29497528076171875, -0.2755775451660156, -0.2561798095703125, -0.23678207397460938, -0.21738433837890625, -0.19798660278320312, -0.1785888671875, -0.15919113159179688, -0.13979339599609375, -0.12039566040039062, -0.1009979248046875, -0.08160018920898438, -0.06220245361328125, -0.042804718017578125, -0.023406982421875, -0.004009246826171875, 0.01538848876953125, 0.034786224365234375, 0.0541839599609375, 0.07358169555664062, 0.09297943115234375, 0.11237716674804688, 0.13177490234375, 0.15117263793945312, 0.17057037353515625, 0.18996810913085938, 0.2093658447265625, 0.22876358032226562, 0.24816131591796875, 0.2675590515136719, 0.286956787109375, 0.3063545227050781, 0.32575225830078125, 0.3451499938964844, 0.3645477294921875, 0.3839454650878906, 0.40334320068359375, 0.4227409362792969, 0.442138671875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 24.0, 35.0, 32.0, 59.0, 91.0, 114.0, 112.0, 139.0, 112.0, 102.0, 69.0, 35.0, 24.0, 21.0, 12.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19970703125, -0.18547821044921875, -0.1712493896484375, -0.15702056884765625, -0.142791748046875, -0.12856292724609375, -0.1143341064453125, -0.10010528564453125, -0.08587646484375, -0.07164764404296875, -0.0574188232421875, -0.04319000244140625, -0.028961181640625, -0.01473236083984375, -0.0005035400390625, 0.01372528076171875, 0.0279541015625, 0.04218292236328125, 0.0564117431640625, 0.07064056396484375, 0.084869384765625, 0.09909820556640625, 0.1133270263671875, 0.12755584716796875, 0.14178466796875, 0.15601348876953125, 0.1702423095703125, 0.18447113037109375, 0.198699951171875, 0.21292877197265625, 0.2271575927734375, 0.24138641357421875, 0.255615234375, 0.26984405517578125, 0.2840728759765625, 0.29830169677734375, 0.312530517578125, 0.32675933837890625, 0.3409881591796875, 0.35521697998046875, 0.36944580078125, 0.38367462158203125, 0.3979034423828125, 0.41213226318359375, 0.426361083984375, 0.44058990478515625, 0.4548187255859375, 0.46904754638671875, 0.4832763671875, 0.49750518798828125, 0.5117340087890625, 0.5259628295898438, 0.540191650390625, 0.5544204711914062, 0.5686492919921875, 0.5828781127929688, 0.59710693359375, 0.6113357543945312, 0.6255645751953125, 0.6397933959960938, 0.654022216796875, 0.6682510375976562, 0.6824798583984375, 0.6967086791992188, 0.7109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 13.0, 20.0, 73.0, 175.0, 242.0, 237.0, 163.0, 50.0, 21.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.493064880371094, -10.223384857177734, -9.953704833984375, -9.684024810791016, -9.414344787597656, -9.144664764404297, -8.874984741210938, -8.605304718017578, -8.335624694824219, -8.06594467163086, -7.7962646484375, -7.526584625244141, -7.256904602050781, -6.987224578857422, -6.7175445556640625, -6.447864532470703, -6.178184509277344, -5.908504486083984, -5.638824462890625, -5.369144439697266, -5.099464416503906, -4.829784393310547, -4.5601043701171875, -4.290424346923828, -4.020744323730469, -3.7510643005371094, -3.48138427734375, -3.2117042541503906, -2.9420242309570312, -2.672344207763672, -2.4026641845703125, -2.132984161376953, -1.8633041381835938, -1.5936241149902344, -1.323944091796875, -1.0542640686035156, -0.7845840454101562, -0.5149040222167969, -0.2452239990234375, 0.024456024169921875, 0.29413604736328125, 0.5638160705566406, 0.83349609375, 1.1031761169433594, 1.3728561401367188, 1.6425361633300781, 1.9122161865234375, 2.181896209716797, 2.4515762329101562, 2.7212562561035156, 2.990936279296875, 3.2606163024902344, 3.5302963256835938, 3.799976348876953, 4.0696563720703125, 4.339336395263672, 4.609016418457031, 4.878696441650391, 5.14837646484375, 5.418056488037109, 5.687736511230469, 5.957416534423828, 6.2270965576171875, 6.496776580810547, 6.766456604003906]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 13.0, 11.0, 19.0, 13.0, 27.0, 29.0, 30.0, 46.0, 50.0, 44.0, 57.0, 62.0, 69.0, 50.0, 59.0, 57.0, 68.0, 51.0, 42.0, 38.0, 35.0, 26.0, 27.0, 13.0, 12.0, 11.0, 5.0, 4.0, 9.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0462570190429688, -2.949765920639038, -2.8532748222351074, -2.7567834854125977, -2.660292387008667, -2.5638012886047363, -2.4673101902008057, -2.370819091796875, -2.2743279933929443, -2.1778368949890137, -2.081345796585083, -1.9848545789718628, -1.8883634805679321, -1.791872262954712, -1.6953811645507812, -1.5988900661468506, -1.5023988485336304, -1.4059077501296997, -1.3094165325164795, -1.2129254341125488, -1.1164343357086182, -1.0199432373046875, -0.9234520196914673, -0.8269609212875366, -0.7304697632789612, -0.6339786052703857, -0.5374875068664551, -0.44099634885787964, -0.3445052206516266, -0.24801409244537354, -0.1515229344367981, -0.05503183603286743, 0.04145932197570801, 0.13795045018196106, 0.2344415932893753, 0.33093273639678955, 0.4274238646030426, 0.5239149928092957, 0.6204061508178711, 0.7168972492218018, 0.8133884072303772, 0.9098795652389526, 1.0063706636428833, 1.1028618812561035, 1.1993529796600342, 1.2958440780639648, 1.3923351764678955, 1.4888262748718262, 1.5853174924850464, 1.681808590888977, 1.7782998085021973, 1.874790906906128, 1.9712820053100586, 2.0677731037139893, 2.16426420211792, 2.2607555389404297, 2.3572466373443604, 2.453737735748291, 2.5502288341522217, 2.6467199325561523, 2.743211269378662, 2.8397023677825928, 2.9361934661865234, 3.032684564590454, 3.1291756629943848]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 5.0, 11.0, 7.0, 14.0, 18.0, 12.0, 27.0, 32.0, 46.0, 50.0, 77.0, 100.0, 145.0, 200.0, 326.0, 447.0, 798.0, 1893.0, 6126.0, 34675.0, 1125523.0, 2970950.0, 41162.0, 7091.0, 2151.0, 945.0, 485.0, 315.0, 191.0, 133.0, 69.0, 70.0, 53.0, 37.0, 17.0, 19.0, 11.0, 6.0, 8.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.078125, -2.0170745849609375, -1.956024169921875, -1.8949737548828125, -1.83392333984375, -1.7728729248046875, -1.711822509765625, -1.6507720947265625, -1.5897216796875, -1.5286712646484375, -1.467620849609375, -1.4065704345703125, -1.34552001953125, -1.2844696044921875, -1.223419189453125, -1.1623687744140625, -1.101318359375, -1.0402679443359375, -0.979217529296875, -0.9181671142578125, -0.85711669921875, -0.7960662841796875, -0.735015869140625, -0.6739654541015625, -0.6129150390625, -0.5518646240234375, -0.490814208984375, -0.4297637939453125, -0.36871337890625, -0.3076629638671875, -0.246612548828125, -0.1855621337890625, -0.12451171875, -0.0634613037109375, -0.002410888671875, 0.0586395263671875, 0.11968994140625, 0.1807403564453125, 0.241790771484375, 0.3028411865234375, 0.3638916015625, 0.4249420166015625, 0.485992431640625, 0.5470428466796875, 0.60809326171875, 0.6691436767578125, 0.730194091796875, 0.7912445068359375, 0.852294921875, 0.9133453369140625, 0.974395751953125, 1.0354461669921875, 1.09649658203125, 1.1575469970703125, 1.218597412109375, 1.2796478271484375, 1.3406982421875, 1.4017486572265625, 1.462799072265625, 1.5238494873046875, 1.58489990234375, 1.6459503173828125, 1.707000732421875, 1.7680511474609375, 1.8291015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 12.0, 23.0, 29.0, 45.0, 59.0, 75.0, 102.0, 108.0, 112.0, 116.0, 97.0, 62.0, 50.0, 34.0, 33.0, 19.0, 7.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.269287109375, -0.2627716064453125, -0.256256103515625, -0.2497406005859375, -0.24322509765625, -0.2367095947265625, -0.230194091796875, -0.2236785888671875, -0.2171630859375, -0.2106475830078125, -0.204132080078125, -0.1976165771484375, -0.19110107421875, -0.1845855712890625, -0.178070068359375, -0.1715545654296875, -0.1650390625, -0.1585235595703125, -0.152008056640625, -0.1454925537109375, -0.13897705078125, -0.1324615478515625, -0.125946044921875, -0.1194305419921875, -0.1129150390625, -0.1063995361328125, -0.099884033203125, -0.0933685302734375, -0.08685302734375, -0.0803375244140625, -0.073822021484375, -0.0673065185546875, -0.060791015625, -0.0542755126953125, -0.047760009765625, -0.0412445068359375, -0.03472900390625, -0.0282135009765625, -0.021697998046875, -0.0151824951171875, -0.0086669921875, -0.0021514892578125, 0.004364013671875, 0.0108795166015625, 0.01739501953125, 0.0239105224609375, 0.030426025390625, 0.0369415283203125, 0.04345703125, 0.0499725341796875, 0.056488037109375, 0.0630035400390625, 0.06951904296875, 0.0760345458984375, 0.082550048828125, 0.0890655517578125, 0.0955810546875, 0.1020965576171875, 0.108612060546875, 0.1151275634765625, 0.12164306640625, 0.1281585693359375, 0.134674072265625, 0.1411895751953125, 0.147705078125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 10.0, 15.0, 14.0, 19.0, 30.0, 57.0, 99.0, 138.0, 242.0, 419.0, 903.0, 2599.0, 9205.0, 44810.0, 512200.0, 3480231.0, 116132.0, 19412.0, 4903.0, 1457.0, 603.0, 278.0, 178.0, 99.0, 79.0, 37.0, 32.0, 28.0, 13.0, 12.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1629638671875, -1.125732421875, -1.0885009765625, -1.05126953125, -1.0140380859375, -0.976806640625, -0.9395751953125, -0.90234375, -0.8651123046875, -0.827880859375, -0.7906494140625, -0.75341796875, -0.7161865234375, -0.678955078125, -0.6417236328125, -0.6044921875, -0.5672607421875, -0.530029296875, -0.4927978515625, -0.45556640625, -0.4183349609375, -0.381103515625, -0.3438720703125, -0.306640625, -0.2694091796875, -0.232177734375, -0.1949462890625, -0.15771484375, -0.1204833984375, -0.083251953125, -0.0460205078125, -0.0087890625, 0.0284423828125, 0.065673828125, 0.1029052734375, 0.14013671875, 0.1773681640625, 0.214599609375, 0.2518310546875, 0.2890625, 0.3262939453125, 0.363525390625, 0.4007568359375, 0.43798828125, 0.4752197265625, 0.512451171875, 0.5496826171875, 0.5869140625, 0.6241455078125, 0.661376953125, 0.6986083984375, 0.73583984375, 0.7730712890625, 0.810302734375, 0.8475341796875, 0.884765625, 0.9219970703125, 0.959228515625, 0.9964599609375, 1.03369140625, 1.0709228515625, 1.108154296875, 1.1453857421875, 1.1826171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 14.0, 11.0, 30.0, 32.0, 74.0, 136.0, 271.0, 683.0, 1763.0, 508.0, 215.0, 110.0, 77.0, 53.0, 23.0, 25.0, 14.0, 9.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333984375, -0.32131195068359375, -0.3086395263671875, -0.29596710205078125, -0.283294677734375, -0.27062225341796875, -0.2579498291015625, -0.24527740478515625, -0.23260498046875, -0.21993255615234375, -0.2072601318359375, -0.19458770751953125, -0.181915283203125, -0.16924285888671875, -0.1565704345703125, -0.14389801025390625, -0.1312255859375, -0.11855316162109375, -0.1058807373046875, -0.09320831298828125, -0.080535888671875, -0.06786346435546875, -0.0551910400390625, -0.04251861572265625, -0.02984619140625, -0.01717376708984375, -0.0045013427734375, 0.00817108154296875, 0.020843505859375, 0.03351593017578125, 0.0461883544921875, 0.05886077880859375, 0.071533203125, 0.08420562744140625, 0.0968780517578125, 0.10955047607421875, 0.122222900390625, 0.13489532470703125, 0.1475677490234375, 0.16024017333984375, 0.17291259765625, 0.18558502197265625, 0.1982574462890625, 0.21092987060546875, 0.223602294921875, 0.23627471923828125, 0.2489471435546875, 0.26161956787109375, 0.2742919921875, 0.28696441650390625, 0.2996368408203125, 0.31230926513671875, 0.324981689453125, 0.33765411376953125, 0.3503265380859375, 0.36299896240234375, 0.37567138671875, 0.38834381103515625, 0.4010162353515625, 0.41368865966796875, 0.426361083984375, 0.43903350830078125, 0.4517059326171875, 0.46437835693359375, 0.47705078125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 14.0, 25.0, 51.0, 86.0, 166.0, 191.0, 153.0, 124.0, 83.0, 46.0, 28.0, 6.0, 8.0, 2.0, 10.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3724277019500732, -2.2828047275543213, -2.1931819915771484, -2.1035590171813965, -2.0139360427856445, -1.9243131875991821, -1.8346903324127197, -1.7450673580169678, -1.6554445028305054, -1.565821647644043, -1.476198673248291, -1.3865758180618286, -1.2969529628753662, -1.2073299884796143, -1.1177071332931519, -1.0280842781066895, -0.9384613037109375, -0.8488383889198303, -0.7592154741287231, -0.6695926189422607, -0.5799697041511536, -0.4903467893600464, -0.400723934173584, -0.3111010193824768, -0.22147810459136963, -0.13185520470142365, -0.04223230481147766, 0.04739058017730713, 0.1370134949684143, 0.22663640975952148, 0.3162592649459839, 0.40588217973709106, 0.49550509452819824, 0.5851280093193054, 0.6747509241104126, 0.764373779296875, 0.8539966940879822, 0.9436196088790894, 1.0332424640655518, 1.1228654384613037, 1.2124882936477661, 1.3021111488342285, 1.3917341232299805, 1.4813569784164429, 1.5709798336029053, 1.6606028079986572, 1.7502256631851196, 1.839848518371582, 1.929471492767334, 2.019094467163086, 2.108717203140259, 2.1983401775360107, 2.2879631519317627, 2.3775858879089355, 2.4672088623046875, 2.5568318367004395, 2.6464548110961914, 2.7360777854919434, 2.825700521469116, 2.915323495864868, 3.00494647026062, 3.094569206237793, 3.184192180633545, 3.273815155029297, 3.3634378910064697]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 9.0, 17.0, 17.0, 25.0, 22.0, 30.0, 35.0, 35.0, 43.0, 50.0, 56.0, 57.0, 54.0, 61.0, 69.0, 59.0, 51.0, 56.0, 39.0, 41.0, 38.0, 24.0, 33.0, 16.0, 15.0, 11.0, 8.0, 10.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2504863739013672, -1.208534598350525, -1.166582703590393, -1.1246309280395508, -1.082679033279419, -1.0407272577285767, -0.9987754225730896, -0.9568235874176025, -0.9148717522621155, -0.8729199171066284, -0.8309680819511414, -0.7890162467956543, -0.747064471244812, -0.7051125764846802, -0.6631608009338379, -0.6212089657783508, -0.5792571306228638, -0.5373052954673767, -0.49535346031188965, -0.453401654958725, -0.4114498198032379, -0.36949798464775085, -0.3275461792945862, -0.2855943441390991, -0.24364250898361206, -0.201690673828125, -0.15973885357379913, -0.11778703331947327, -0.0758351981639862, -0.033883363008499146, 0.008068442344665527, 0.05002027750015259, 0.09197211265563965, 0.1339239478111267, 0.17587576806545258, 0.21782758831977844, 0.2597794234752655, 0.30173125863075256, 0.34368306398391724, 0.3856348991394043, 0.42758673429489136, 0.4695385694503784, 0.5114904046058655, 0.5534422397613525, 0.5953940153121948, 0.6373459100723267, 0.679297685623169, 0.721249520778656, 0.7632013559341431, 0.8051531910896301, 0.8471050262451172, 0.8890568017959595, 0.9310086965560913, 0.9729604721069336, 1.0149123668670654, 1.0568641424179077, 1.09881591796875, 1.1407676935195923, 1.1827195882797241, 1.2246713638305664, 1.2666232585906982, 1.3085750341415405, 1.3505268096923828, 1.3924787044525146, 1.4344305992126465]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 9.0, 6.0, 10.0, 12.0, 15.0, 32.0, 29.0, 43.0, 66.0, 103.0, 130.0, 229.0, 365.0, 608.0, 1338.0, 3888.0, 20911.0, 260750.0, 678350.0, 69107.0, 8355.0, 2150.0, 815.0, 441.0, 264.0, 138.0, 130.0, 74.0, 57.0, 30.0, 18.0, 23.0, 15.0, 10.0, 4.0, 11.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.763671875, -1.71063232421875, -1.6575927734375, -1.60455322265625, -1.551513671875, -1.49847412109375, -1.4454345703125, -1.39239501953125, -1.33935546875, -1.28631591796875, -1.2332763671875, -1.18023681640625, -1.127197265625, -1.07415771484375, -1.0211181640625, -0.96807861328125, -0.9150390625, -0.86199951171875, -0.8089599609375, -0.75592041015625, -0.702880859375, -0.64984130859375, -0.5968017578125, -0.54376220703125, -0.49072265625, -0.43768310546875, -0.3846435546875, -0.33160400390625, -0.278564453125, -0.22552490234375, -0.1724853515625, -0.11944580078125, -0.06640625, -0.01336669921875, 0.0396728515625, 0.09271240234375, 0.145751953125, 0.19879150390625, 0.2518310546875, 0.30487060546875, 0.35791015625, 0.41094970703125, 0.4639892578125, 0.51702880859375, 0.570068359375, 0.62310791015625, 0.6761474609375, 0.72918701171875, 0.7822265625, 0.83526611328125, 0.8883056640625, 0.94134521484375, 0.994384765625, 1.04742431640625, 1.1004638671875, 1.15350341796875, 1.20654296875, 1.25958251953125, 1.3126220703125, 1.36566162109375, 1.418701171875, 1.47174072265625, 1.5247802734375, 1.57781982421875, 1.630859375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 13.0, 16.0, 39.0, 55.0, 69.0, 67.0, 93.0, 114.0, 97.0, 118.0, 75.0, 69.0, 47.0, 37.0, 39.0, 14.0, 11.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.25766563415527344, -0.2509269714355469, -0.2441883087158203, -0.23744964599609375, -0.2307109832763672, -0.22397232055664062, -0.21723365783691406, -0.2104949951171875, -0.20375633239746094, -0.19701766967773438, -0.1902790069580078, -0.18354034423828125, -0.1768016815185547, -0.17006301879882812, -0.16332435607910156, -0.156585693359375, -0.14984703063964844, -0.14310836791992188, -0.1363697052001953, -0.12963104248046875, -0.12289237976074219, -0.11615371704101562, -0.10941505432128906, -0.1026763916015625, -0.09593772888183594, -0.08919906616210938, -0.08246040344238281, -0.07572174072265625, -0.06898307800292969, -0.062244415283203125, -0.05550575256347656, -0.04876708984375, -0.04202842712402344, -0.035289764404296875, -0.028551101684570312, -0.02181243896484375, -0.015073776245117188, -0.008335113525390625, -0.0015964508056640625, 0.0051422119140625, 0.011880874633789062, 0.018619537353515625, 0.025358200073242188, 0.03209686279296875, 0.03883552551269531, 0.045574188232421875, 0.05231285095214844, 0.059051513671875, 0.06579017639160156, 0.07252883911132812, 0.07926750183105469, 0.08600616455078125, 0.09274482727050781, 0.09948348999023438, 0.10622215270996094, 0.1129608154296875, 0.11969947814941406, 0.12643814086914062, 0.1331768035888672, 0.13991546630859375, 0.1466541290283203, 0.15339279174804688, 0.16013145446777344, 0.1668701171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 4.0, 9.0, 15.0, 14.0, 11.0, 19.0, 34.0, 35.0, 46.0, 70.0, 110.0, 146.0, 208.0, 355.0, 598.0, 1084.0, 2602.0, 7035.0, 23461.0, 89649.0, 324858.0, 411001.0, 135891.0, 34574.0, 9980.0, 3304.0, 1447.0, 681.0, 404.0, 257.0, 196.0, 126.0, 94.0, 65.0, 37.0, 47.0, 23.0, 13.0, 11.0, 9.0, 7.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6533203125, -0.6323471069335938, -0.6113739013671875, -0.5904006958007812, -0.569427490234375, -0.5484542846679688, -0.5274810791015625, -0.5065078735351562, -0.48553466796875, -0.46456146240234375, -0.4435882568359375, -0.42261505126953125, -0.401641845703125, -0.38066864013671875, -0.3596954345703125, -0.33872222900390625, -0.3177490234375, -0.29677581787109375, -0.2758026123046875, -0.25482940673828125, -0.233856201171875, -0.21288299560546875, -0.1919097900390625, -0.17093658447265625, -0.14996337890625, -0.12899017333984375, -0.1080169677734375, -0.08704376220703125, -0.066070556640625, -0.04509735107421875, -0.0241241455078125, -0.00315093994140625, 0.017822265625, 0.03879547119140625, 0.0597686767578125, 0.08074188232421875, 0.101715087890625, 0.12268829345703125, 0.1436614990234375, 0.16463470458984375, 0.18560791015625, 0.20658111572265625, 0.2275543212890625, 0.24852752685546875, 0.269500732421875, 0.29047393798828125, 0.3114471435546875, 0.33242034912109375, 0.3533935546875, 0.37436676025390625, 0.3953399658203125, 0.41631317138671875, 0.437286376953125, 0.45825958251953125, 0.4792327880859375, 0.5002059936523438, 0.52117919921875, 0.5421524047851562, 0.5631256103515625, 0.5840988159179688, 0.605072021484375, 0.6260452270507812, 0.6470184326171875, 0.6679916381835938, 0.68896484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 14.0, 25.0, 24.0, 26.0, 28.0, 37.0, 39.0, 45.0, 35.0, 51.0, 44.0, 44.0, 64.0, 45.0, 64.0, 47.0, 37.0, 43.0, 29.0, 48.0, 28.0, 32.0, 23.0, 22.0, 16.0, 19.0, 12.0, 8.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.474365234375, -0.4579505920410156, -0.44153594970703125, -0.4251213073730469, -0.4087066650390625, -0.3922920227050781, -0.37587738037109375, -0.3594627380371094, -0.343048095703125, -0.3266334533691406, -0.31021881103515625, -0.2938041687011719, -0.2773895263671875, -0.2609748840332031, -0.24456024169921875, -0.22814559936523438, -0.21173095703125, -0.19531631469726562, -0.17890167236328125, -0.16248703002929688, -0.1460723876953125, -0.12965774536132812, -0.11324310302734375, -0.09682846069335938, -0.080413818359375, -0.06399917602539062, -0.04758453369140625, -0.031169891357421875, -0.0147552490234375, 0.001659393310546875, 0.01807403564453125, 0.034488677978515625, 0.0509033203125, 0.06731796264648438, 0.08373260498046875, 0.10014724731445312, 0.1165618896484375, 0.13297653198242188, 0.14939117431640625, 0.16580581665039062, 0.182220458984375, 0.19863510131835938, 0.21504974365234375, 0.23146438598632812, 0.2478790283203125, 0.2642936706542969, 0.28070831298828125, 0.2971229553222656, 0.31353759765625, 0.3299522399902344, 0.34636688232421875, 0.3627815246582031, 0.3791961669921875, 0.3956108093261719, 0.41202545166015625, 0.4284400939941406, 0.444854736328125, 0.4612693786621094, 0.47768402099609375, 0.4940986633300781, 0.5105133056640625, 0.5269279479980469, 0.5433425903320312, 0.5597572326660156, 0.576171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 6.0, 10.0, 11.0, 17.0, 17.0, 53.0, 59.0, 100.0, 189.0, 264.0, 495.0, 956.0, 2007.0, 4832.0, 13599.0, 46829.0, 181553.0, 429887.0, 264842.0, 71769.0, 19240.0, 6529.0, 2555.0, 1259.0, 596.0, 357.0, 195.0, 102.0, 77.0, 48.0, 27.0, 18.0, 14.0, 7.0, 5.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2615394592285156, -0.25208282470703125, -0.24262619018554688, -0.2331695556640625, -0.22371292114257812, -0.21425628662109375, -0.20479965209960938, -0.195343017578125, -0.18588638305664062, -0.17642974853515625, -0.16697311401367188, -0.1575164794921875, -0.14805984497070312, -0.13860321044921875, -0.12914657592773438, -0.11968994140625, -0.11023330688476562, -0.10077667236328125, -0.09132003784179688, -0.0818634033203125, -0.07240676879882812, -0.06295013427734375, -0.053493499755859375, -0.044036865234375, -0.034580230712890625, -0.02512359619140625, -0.015666961669921875, -0.0062103271484375, 0.003246307373046875, 0.01270294189453125, 0.022159576416015625, 0.0316162109375, 0.041072845458984375, 0.05052947998046875, 0.059986114501953125, 0.0694427490234375, 0.07889938354492188, 0.08835601806640625, 0.09781265258789062, 0.107269287109375, 0.11672592163085938, 0.12618255615234375, 0.13563919067382812, 0.1450958251953125, 0.15455245971679688, 0.16400909423828125, 0.17346572875976562, 0.18292236328125, 0.19237899780273438, 0.20183563232421875, 0.21129226684570312, 0.2207489013671875, 0.23020553588867188, 0.23966217041015625, 0.24911880493164062, 0.258575439453125, 0.2680320739746094, 0.27748870849609375, 0.2869453430175781, 0.2964019775390625, 0.3058586120605469, 0.31531524658203125, 0.3247718811035156, 0.334228515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 8.0, 10.0, 4.0, 7.0, 13.0, 8.0, 12.0, 15.0, 20.0, 30.0, 32.0, 53.0, 55.0, 66.0, 61.0, 68.0, 79.0, 91.0, 70.0, 46.0, 35.0, 31.0, 24.0, 23.0, 17.0, 24.0, 10.0, 10.0, 5.0, 7.0, 7.0, 8.0, 7.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.547306060791016e-05, -8.297152817249298e-05, -8.04699957370758e-05, -7.796846330165863e-05, -7.546693086624146e-05, -7.296539843082428e-05, -7.04638659954071e-05, -6.796233355998993e-05, -6.546080112457275e-05, -6.295926868915558e-05, -6.04577362537384e-05, -5.795620381832123e-05, -5.545467138290405e-05, -5.295313894748688e-05, -5.04516065120697e-05, -4.795007407665253e-05, -4.544854164123535e-05, -4.2947009205818176e-05, -4.0445476770401e-05, -3.7943944334983826e-05, -3.544241189956665e-05, -3.2940879464149475e-05, -3.04393470287323e-05, -2.7937814593315125e-05, -2.543628215789795e-05, -2.2934749722480774e-05, -2.04332172870636e-05, -1.7931684851646423e-05, -1.5430152416229248e-05, -1.2928619980812073e-05, -1.0427087545394897e-05, -7.925555109977722e-06, -5.424022674560547e-06, -2.9224902391433716e-06, -4.209578037261963e-07, 2.080574631690979e-06, 4.582107067108154e-06, 7.08363950252533e-06, 9.585171937942505e-06, 1.208670437335968e-05, 1.4588236808776855e-05, 1.708976924419403e-05, 1.9591301679611206e-05, 2.209283411502838e-05, 2.4594366550445557e-05, 2.7095898985862732e-05, 2.9597431421279907e-05, 3.209896385669708e-05, 3.460049629211426e-05, 3.710202872753143e-05, 3.960356116294861e-05, 4.2105093598365784e-05, 4.460662603378296e-05, 4.7108158469200134e-05, 4.960969090461731e-05, 5.2111223340034485e-05, 5.461275577545166e-05, 5.7114288210868835e-05, 5.961582064628601e-05, 6.211735308170319e-05, 6.461888551712036e-05, 6.712041795253754e-05, 6.962195038795471e-05, 7.212348282337189e-05, 7.462501525878906e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 2.0, 6.0, 11.0, 11.0, 18.0, 29.0, 32.0, 60.0, 75.0, 130.0, 180.0, 335.0, 558.0, 1227.0, 2825.0, 9017.0, 38178.0, 204187.0, 519927.0, 215845.0, 40807.0, 9389.0, 2976.0, 1254.0, 595.0, 300.0, 208.0, 109.0, 76.0, 48.0, 45.0, 27.0, 13.0, 13.0, 7.0, 10.0, 2.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.341064453125, -0.3295097351074219, -0.31795501708984375, -0.3064002990722656, -0.2948455810546875, -0.2832908630371094, -0.27173614501953125, -0.2601814270019531, -0.248626708984375, -0.23707199096679688, -0.22551727294921875, -0.21396255493164062, -0.2024078369140625, -0.19085311889648438, -0.17929840087890625, -0.16774368286132812, -0.15618896484375, -0.14463424682617188, -0.13307952880859375, -0.12152481079101562, -0.1099700927734375, -0.09841537475585938, -0.08686065673828125, -0.07530593872070312, -0.063751220703125, -0.052196502685546875, -0.04064178466796875, -0.029087066650390625, -0.0175323486328125, -0.005977630615234375, 0.00557708740234375, 0.017131805419921875, 0.0286865234375, 0.040241241455078125, 0.05179595947265625, 0.06335067749023438, 0.0749053955078125, 0.08646011352539062, 0.09801483154296875, 0.10956954956054688, 0.121124267578125, 0.13267898559570312, 0.14423370361328125, 0.15578842163085938, 0.1673431396484375, 0.17889785766601562, 0.19045257568359375, 0.20200729370117188, 0.21356201171875, 0.22511672973632812, 0.23667144775390625, 0.24822616577148438, 0.2597808837890625, 0.2713356018066406, 0.28289031982421875, 0.2944450378417969, 0.305999755859375, 0.3175544738769531, 0.32910919189453125, 0.3406639099121094, 0.3522186279296875, 0.3637733459472656, 0.37532806396484375, 0.3868827819824219, 0.3984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 10.0, 9.0, 17.0, 18.0, 22.0, 35.0, 62.0, 47.0, 69.0, 80.0, 92.0, 101.0, 82.0, 72.0, 71.0, 62.0, 46.0, 31.0, 23.0, 18.0, 8.0, 12.0, 11.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46923828125, -0.4588775634765625, -0.448516845703125, -0.4381561279296875, -0.42779541015625, -0.4174346923828125, -0.407073974609375, -0.3967132568359375, -0.3863525390625, -0.3759918212890625, -0.365631103515625, -0.3552703857421875, -0.34490966796875, -0.3345489501953125, -0.324188232421875, -0.3138275146484375, -0.303466796875, -0.2931060791015625, -0.282745361328125, -0.2723846435546875, -0.26202392578125, -0.2516632080078125, -0.241302490234375, -0.2309417724609375, -0.2205810546875, -0.2102203369140625, -0.199859619140625, -0.1894989013671875, -0.17913818359375, -0.1687774658203125, -0.158416748046875, -0.1480560302734375, -0.1376953125, -0.1273345947265625, -0.116973876953125, -0.1066131591796875, -0.09625244140625, -0.0858917236328125, -0.075531005859375, -0.0651702880859375, -0.0548095703125, -0.0444488525390625, -0.034088134765625, -0.0237274169921875, -0.01336669921875, -0.0030059814453125, 0.007354736328125, 0.0177154541015625, 0.028076171875, 0.0384368896484375, 0.048797607421875, 0.0591583251953125, 0.06951904296875, 0.0798797607421875, 0.090240478515625, 0.1006011962890625, 0.1109619140625, 0.1213226318359375, 0.131683349609375, 0.1420440673828125, 0.15240478515625, 0.1627655029296875, 0.173126220703125, 0.1834869384765625, 0.19384765625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 23.0, 30.0, 61.0, 97.0, 140.0, 148.0, 163.0, 108.0, 96.0, 60.0, 25.0, 16.0, 10.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.731440544128418, -4.548333168029785, -4.3652262687683105, -4.182119369506836, -3.999011993408203, -3.8159048557281494, -3.6327977180480957, -3.449690580368042, -3.2665834426879883, -3.0834763050079346, -2.900369167327881, -2.717262029647827, -2.5341548919677734, -2.3510477542877197, -2.167940616607666, -1.9848334789276123, -1.8017263412475586, -1.6186192035675049, -1.4355120658874512, -1.2524049282073975, -1.0692977905273438, -0.88619065284729, -0.7030835151672363, -0.5199763774871826, -0.3368692398071289, -0.1537621021270752, 0.029345035552978516, 0.21245217323303223, 0.39555931091308594, 0.5786664485931396, 0.7617735862731934, 0.9448807239532471, 1.127988338470459, 1.3110954761505127, 1.4942026138305664, 1.6773097515106201, 1.8604168891906738, 2.0435240268707275, 2.2266311645507812, 2.409738302230835, 2.5928454399108887, 2.7759525775909424, 2.959059715270996, 3.14216685295105, 3.3252739906311035, 3.5083811283111572, 3.691488265991211, 3.8745954036712646, 4.057702541351318, 4.240809440612793, 4.423916816711426, 4.607024192810059, 4.790131092071533, 4.973237991333008, 5.156345367431641, 5.339452743530273, 5.522559642791748, 5.705666542053223, 5.8887739181518555, 6.071881294250488, 6.254988193511963, 6.4380950927734375, 6.62120246887207, 6.804309844970703, 6.987416744232178]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 6.0, 4.0, 10.0, 9.0, 14.0, 16.0, 22.0, 19.0, 14.0, 23.0, 27.0, 28.0, 36.0, 55.0, 46.0, 39.0, 48.0, 35.0, 49.0, 47.0, 50.0, 56.0, 39.0, 61.0, 38.0, 28.0, 28.0, 28.0, 28.0, 17.0, 14.0, 13.0, 12.0, 3.0, 9.0, 8.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8268818855285645, -2.734602451324463, -2.6423230171203613, -2.5500435829162598, -2.457764148712158, -2.3654849529266357, -2.273205518722534, -2.1809260845184326, -2.088646650314331, -1.9963672161102295, -1.904087781906128, -1.811808466911316, -1.7195290327072144, -1.6272495985031128, -1.5349702835083008, -1.4426908493041992, -1.3504114151000977, -1.258131980895996, -1.1658525466918945, -1.0735732316970825, -0.981293797492981, -0.8890143632888794, -0.7967349886894226, -0.7044556140899658, -0.6121761798858643, -0.5198967456817627, -0.4276173710823059, -0.33533796668052673, -0.24305856227874756, -0.15077915787696838, -0.05849975347518921, 0.03377962112426758, 0.12605905532836914, 0.21833845973014832, 0.3106178641319275, 0.40289726853370667, 0.49517667293548584, 0.5874561071395874, 0.6797354817390442, 0.772014856338501, 0.8642942905426025, 0.9565737247467041, 1.0488531589508057, 1.1411324739456177, 1.2334119081497192, 1.3256913423538208, 1.4179706573486328, 1.5102500915527344, 1.602529525756836, 1.6948089599609375, 1.787088394165039, 1.879367709159851, 1.9716471433639526, 2.0639264583587646, 2.156205892562866, 2.2484853267669678, 2.3407647609710693, 2.433044195175171, 2.5253236293792725, 2.617603063583374, 2.7098822593688965, 2.802161693572998, 2.8944411277770996, 2.986720561981201, 3.0789999961853027]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 9.0, 12.0, 11.0, 12.0, 22.0, 23.0, 35.0, 34.0, 50.0, 81.0, 94.0, 172.0, 222.0, 379.0, 703.0, 1564.0, 5188.0, 35809.0, 2444908.0, 1662321.0, 33675.0, 5259.0, 1711.0, 783.0, 438.0, 238.0, 177.0, 102.0, 73.0, 43.0, 41.0, 21.0, 20.0, 14.0, 10.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.1875, -2.123138427734375, -2.05877685546875, -1.994415283203125, -1.9300537109375, -1.865692138671875, -1.80133056640625, -1.736968994140625, -1.672607421875, -1.608245849609375, -1.54388427734375, -1.479522705078125, -1.4151611328125, -1.350799560546875, -1.28643798828125, -1.222076416015625, -1.15771484375, -1.093353271484375, -1.02899169921875, -0.964630126953125, -0.9002685546875, -0.835906982421875, -0.77154541015625, -0.707183837890625, -0.642822265625, -0.578460693359375, -0.51409912109375, -0.449737548828125, -0.3853759765625, -0.321014404296875, -0.25665283203125, -0.192291259765625, -0.1279296875, -0.063568115234375, 0.00079345703125, 0.065155029296875, 0.1295166015625, 0.193878173828125, 0.25823974609375, 0.322601318359375, 0.386962890625, 0.451324462890625, 0.51568603515625, 0.580047607421875, 0.6444091796875, 0.708770751953125, 0.77313232421875, 0.837493896484375, 0.90185546875, 0.966217041015625, 1.03057861328125, 1.094940185546875, 1.1593017578125, 1.223663330078125, 1.28802490234375, 1.352386474609375, 1.416748046875, 1.481109619140625, 1.54547119140625, 1.609832763671875, 1.6741943359375, 1.738555908203125, 1.80291748046875, 1.867279052734375, 1.931640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 22.0, 43.0, 58.0, 64.0, 72.0, 80.0, 98.0, 110.0, 96.0, 84.0, 60.0, 65.0, 38.0, 26.0, 22.0, 11.0, 6.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27734375, -0.27045631408691406, -0.2635688781738281, -0.2566814422607422, -0.24979400634765625, -0.2429065704345703, -0.23601913452148438, -0.22913169860839844, -0.2222442626953125, -0.21535682678222656, -0.20846939086914062, -0.2015819549560547, -0.19469451904296875, -0.1878070831298828, -0.18091964721679688, -0.17403221130371094, -0.167144775390625, -0.16025733947753906, -0.15336990356445312, -0.1464824676513672, -0.13959503173828125, -0.1327075958251953, -0.12582015991210938, -0.11893272399902344, -0.1120452880859375, -0.10515785217285156, -0.09827041625976562, -0.09138298034667969, -0.08449554443359375, -0.07760810852050781, -0.07072067260742188, -0.06383323669433594, -0.05694580078125, -0.05005836486816406, -0.043170928955078125, -0.03628349304199219, -0.02939605712890625, -0.022508621215820312, -0.015621185302734375, -0.008733749389648438, -0.0018463134765625, 0.0050411224365234375, 0.011928558349609375, 0.018815994262695312, 0.02570343017578125, 0.03259086608886719, 0.039478302001953125, 0.04636573791503906, 0.053253173828125, 0.06014060974121094, 0.06702804565429688, 0.07391548156738281, 0.08080291748046875, 0.08769035339355469, 0.09457778930664062, 0.10146522521972656, 0.1083526611328125, 0.11524009704589844, 0.12212753295898438, 0.1290149688720703, 0.13590240478515625, 0.1427898406982422, 0.14967727661132812, 0.15656471252441406, 0.1634521484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 7.0, 13.0, 18.0, 21.0, 32.0, 55.0, 112.0, 232.0, 518.0, 1344.0, 3755.0, 15786.0, 118680.0, 3552209.0, 455872.0, 35402.0, 6814.0, 2017.0, 747.0, 317.0, 154.0, 81.0, 39.0, 22.0, 9.0, 9.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.45703125, -1.415069580078125, -1.37310791015625, -1.331146240234375, -1.2891845703125, -1.247222900390625, -1.20526123046875, -1.163299560546875, -1.121337890625, -1.079376220703125, -1.03741455078125, -0.995452880859375, -0.9534912109375, -0.911529541015625, -0.86956787109375, -0.827606201171875, -0.78564453125, -0.743682861328125, -0.70172119140625, -0.659759521484375, -0.6177978515625, -0.575836181640625, -0.53387451171875, -0.491912841796875, -0.449951171875, -0.407989501953125, -0.36602783203125, -0.324066162109375, -0.2821044921875, -0.240142822265625, -0.19818115234375, -0.156219482421875, -0.1142578125, -0.072296142578125, -0.03033447265625, 0.011627197265625, 0.0535888671875, 0.095550537109375, 0.13751220703125, 0.179473876953125, 0.221435546875, 0.263397216796875, 0.30535888671875, 0.347320556640625, 0.3892822265625, 0.431243896484375, 0.47320556640625, 0.515167236328125, 0.55712890625, 0.599090576171875, 0.64105224609375, 0.683013916015625, 0.7249755859375, 0.766937255859375, 0.80889892578125, 0.850860595703125, 0.892822265625, 0.934783935546875, 0.97674560546875, 1.018707275390625, 1.0606689453125, 1.102630615234375, 1.14459228515625, 1.186553955078125, 1.228515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 7.0, 18.0, 21.0, 23.0, 28.0, 47.0, 55.0, 80.0, 155.0, 250.0, 509.0, 1282.0, 699.0, 328.0, 176.0, 133.0, 77.0, 58.0, 35.0, 26.0, 13.0, 8.0, 12.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3699188232421875, -0.358245849609375, -0.3465728759765625, -0.33489990234375, -0.3232269287109375, -0.311553955078125, -0.2998809814453125, -0.2882080078125, -0.2765350341796875, -0.264862060546875, -0.2531890869140625, -0.24151611328125, -0.2298431396484375, -0.218170166015625, -0.2064971923828125, -0.19482421875, -0.1831512451171875, -0.171478271484375, -0.1598052978515625, -0.14813232421875, -0.1364593505859375, -0.124786376953125, -0.1131134033203125, -0.1014404296875, -0.0897674560546875, -0.078094482421875, -0.0664215087890625, -0.05474853515625, -0.0430755615234375, -0.031402587890625, -0.0197296142578125, -0.008056640625, 0.0036163330078125, 0.015289306640625, 0.0269622802734375, 0.03863525390625, 0.0503082275390625, 0.061981201171875, 0.0736541748046875, 0.0853271484375, 0.0970001220703125, 0.108673095703125, 0.1203460693359375, 0.13201904296875, 0.1436920166015625, 0.155364990234375, 0.1670379638671875, 0.1787109375, 0.1903839111328125, 0.202056884765625, 0.2137298583984375, 0.22540283203125, 0.2370758056640625, 0.248748779296875, 0.2604217529296875, 0.2720947265625, 0.2837677001953125, 0.295440673828125, 0.3071136474609375, 0.31878662109375, 0.3304595947265625, 0.342132568359375, 0.3538055419921875, 0.365478515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 12.0, 19.0, 27.0, 68.0, 125.0, 200.0, 195.0, 174.0, 87.0, 50.0, 22.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.545332670211792, -1.4198428392410278, -1.2943530082702637, -1.1688631772994995, -1.0433733463287354, -0.9178835153579712, -0.792393684387207, -0.6669038534164429, -0.5414140224456787, -0.41592419147491455, -0.2904343605041504, -0.16494452953338623, -0.03945469856262207, 0.08603513240814209, 0.21152496337890625, 0.3370147943496704, 0.46250462532043457, 0.5879944562911987, 0.7134842872619629, 0.838974118232727, 0.9644639492034912, 1.0899537801742554, 1.2154436111450195, 1.3409334421157837, 1.4664232730865479, 1.591913104057312, 1.7174029350280762, 1.8428927659988403, 1.9683825969696045, 2.093872547149658, 2.219362258911133, 2.3448519706726074, 2.4703421592712402, 2.595831871032715, 2.7213218212127686, 2.8468117713928223, 2.972301483154297, 3.0977911949157715, 3.223281145095825, 3.348771095275879, 3.4742608070373535, 3.599750518798828, 3.725240468978882, 3.8507304191589355, 3.97622013092041, 4.101709842681885, 4.227199554443359, 4.352689743041992, 4.478179454803467, 4.603669166564941, 4.729159355163574, 4.854649066925049, 4.980138778686523, 5.105628490447998, 5.231118202209473, 5.3566083908081055, 5.48209810256958, 5.607587814331055, 5.7330780029296875, 5.858567714691162, 5.984057426452637, 6.109547138214111, 6.235036849975586, 6.360527038574219, 6.486016750335693]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 5.0, 6.0, 6.0, 7.0, 11.0, 8.0, 11.0, 18.0, 27.0, 16.0, 28.0, 28.0, 33.0, 37.0, 52.0, 49.0, 34.0, 36.0, 49.0, 38.0, 54.0, 41.0, 40.0, 44.0, 42.0, 43.0, 26.0, 39.0, 28.0, 23.0, 17.0, 23.0, 20.0, 11.0, 11.0, 6.0, 5.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2867462635040283, -1.2483692169189453, -1.2099921703338623, -1.1716152429580688, -1.1332381963729858, -1.0948611497879028, -1.0564841032028198, -1.0181070566177368, -0.9797300696372986, -0.9413530230522156, -0.9029760360717773, -0.8645989894866943, -0.8262219429016113, -0.7878449559211731, -0.7494679093360901, -0.7110909223556519, -0.6727138757705688, -0.6343368291854858, -0.5959598422050476, -0.5575827956199646, -0.5192058086395264, -0.48082876205444336, -0.44245171546936035, -0.40407469868659973, -0.3656976819038391, -0.3273206651210785, -0.28894364833831787, -0.25056660175323486, -0.21218958497047424, -0.17381256818771362, -0.1354355365037918, -0.09705850481987, -0.058681488037109375, -0.020304463803768158, 0.01807256042957306, 0.056449584662914276, 0.0948266088962555, 0.1332036256790161, 0.17158065736293793, 0.20995768904685974, 0.24833470582962036, 0.286711722612381, 0.3250887393951416, 0.3634657859802246, 0.40184280276298523, 0.44021981954574585, 0.47859686613082886, 0.5169738531112671, 0.5553508996963501, 0.5937279462814331, 0.6321049332618713, 0.6704819798469543, 0.7088589668273926, 0.7472360134124756, 0.7856130599975586, 0.8239901065826416, 0.8623670935630798, 0.9007441401481628, 0.9391211271286011, 0.9774981737136841, 1.015875220298767, 1.0542521476745605, 1.0926291942596436, 1.1310062408447266, 1.1693832874298096]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 13.0, 11.0, 25.0, 23.0, 48.0, 63.0, 83.0, 181.0, 294.0, 643.0, 1666.0, 6687.0, 55763.0, 726125.0, 235078.0, 16691.0, 3144.0, 1002.0, 386.0, 232.0, 133.0, 64.0, 51.0, 37.0, 29.0, 11.0, 13.0, 14.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.458984375, -1.39483642578125, -1.3306884765625, -1.26654052734375, -1.202392578125, -1.13824462890625, -1.0740966796875, -1.00994873046875, -0.94580078125, -0.88165283203125, -0.8175048828125, -0.75335693359375, -0.689208984375, -0.62506103515625, -0.5609130859375, -0.49676513671875, -0.4326171875, -0.36846923828125, -0.3043212890625, -0.24017333984375, -0.176025390625, -0.11187744140625, -0.0477294921875, 0.01641845703125, 0.08056640625, 0.14471435546875, 0.2088623046875, 0.27301025390625, 0.337158203125, 0.40130615234375, 0.4654541015625, 0.52960205078125, 0.59375, 0.65789794921875, 0.7220458984375, 0.78619384765625, 0.850341796875, 0.91448974609375, 0.9786376953125, 1.04278564453125, 1.10693359375, 1.17108154296875, 1.2352294921875, 1.29937744140625, 1.363525390625, 1.42767333984375, 1.4918212890625, 1.55596923828125, 1.6201171875, 1.68426513671875, 1.7484130859375, 1.81256103515625, 1.876708984375, 1.94085693359375, 2.0050048828125, 2.06915283203125, 2.13330078125, 2.19744873046875, 2.2615966796875, 2.32574462890625, 2.389892578125, 2.45404052734375, 2.5181884765625, 2.58233642578125, 2.646484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 17.0, 18.0, 23.0, 39.0, 49.0, 58.0, 65.0, 110.0, 90.0, 92.0, 76.0, 95.0, 65.0, 55.0, 44.0, 31.0, 17.0, 17.0, 13.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.27482032775878906, -0.2676582336425781, -0.2604961395263672, -0.25333404541015625, -0.2461719512939453, -0.23900985717773438, -0.23184776306152344, -0.2246856689453125, -0.21752357482910156, -0.21036148071289062, -0.2031993865966797, -0.19603729248046875, -0.1888751983642578, -0.18171310424804688, -0.17455101013183594, -0.167388916015625, -0.16022682189941406, -0.15306472778320312, -0.1459026336669922, -0.13874053955078125, -0.1315784454345703, -0.12441635131835938, -0.11725425720214844, -0.1100921630859375, -0.10293006896972656, -0.09576797485351562, -0.08860588073730469, -0.08144378662109375, -0.07428169250488281, -0.06711959838867188, -0.05995750427246094, -0.05279541015625, -0.04563331604003906, -0.038471221923828125, -0.03130912780761719, -0.02414703369140625, -0.016984939575195312, -0.009822845458984375, -0.0026607513427734375, 0.0045013427734375, 0.011663436889648438, 0.018825531005859375, 0.025987625122070312, 0.03314971923828125, 0.04031181335449219, 0.047473907470703125, 0.05463600158691406, 0.061798095703125, 0.06896018981933594, 0.07612228393554688, 0.08328437805175781, 0.09044647216796875, 0.09760856628417969, 0.10477066040039062, 0.11193275451660156, 0.1190948486328125, 0.12625694274902344, 0.13341903686523438, 0.1405811309814453, 0.14774322509765625, 0.1549053192138672, 0.16206741333007812, 0.16922950744628906, 0.1763916015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 6.0, 5.0, 11.0, 10.0, 19.0, 27.0, 16.0, 36.0, 58.0, 53.0, 62.0, 100.0, 142.0, 182.0, 353.0, 657.0, 1232.0, 2822.0, 8303.0, 29914.0, 125870.0, 433548.0, 332706.0, 81751.0, 19893.0, 6043.0, 2190.0, 943.0, 529.0, 319.0, 218.0, 109.0, 95.0, 85.0, 47.0, 43.0, 36.0, 23.0, 13.0, 18.0, 11.0, 12.0, 7.0, 10.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.76123046875, -0.7365570068359375, -0.711883544921875, -0.6872100830078125, -0.66253662109375, -0.6378631591796875, -0.613189697265625, -0.5885162353515625, -0.5638427734375, -0.5391693115234375, -0.514495849609375, -0.4898223876953125, -0.46514892578125, -0.4404754638671875, -0.415802001953125, -0.3911285400390625, -0.366455078125, -0.3417816162109375, -0.317108154296875, -0.2924346923828125, -0.26776123046875, -0.2430877685546875, -0.218414306640625, -0.1937408447265625, -0.1690673828125, -0.1443939208984375, -0.119720458984375, -0.0950469970703125, -0.07037353515625, -0.0457000732421875, -0.021026611328125, 0.0036468505859375, 0.0283203125, 0.0529937744140625, 0.077667236328125, 0.1023406982421875, 0.12701416015625, 0.1516876220703125, 0.176361083984375, 0.2010345458984375, 0.2257080078125, 0.2503814697265625, 0.275054931640625, 0.2997283935546875, 0.32440185546875, 0.3490753173828125, 0.373748779296875, 0.3984222412109375, 0.423095703125, 0.4477691650390625, 0.472442626953125, 0.4971160888671875, 0.52178955078125, 0.5464630126953125, 0.571136474609375, 0.5958099365234375, 0.6204833984375, 0.6451568603515625, 0.669830322265625, 0.6945037841796875, 0.71917724609375, 0.7438507080078125, 0.768524169921875, 0.7931976318359375, 0.81787109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 12.0, 16.0, 10.0, 8.0, 15.0, 20.0, 30.0, 32.0, 27.0, 42.0, 43.0, 42.0, 52.0, 34.0, 41.0, 47.0, 40.0, 49.0, 38.0, 45.0, 45.0, 30.0, 36.0, 37.0, 42.0, 22.0, 18.0, 22.0, 13.0, 20.0, 12.0, 12.0, 11.0, 9.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4592247009277344, -0.44164276123046875, -0.4240608215332031, -0.4064788818359375, -0.3888969421386719, -0.37131500244140625, -0.3537330627441406, -0.336151123046875, -0.3185691833496094, -0.30098724365234375, -0.2834053039550781, -0.2658233642578125, -0.24824142456054688, -0.23065948486328125, -0.21307754516601562, -0.19549560546875, -0.17791366577148438, -0.16033172607421875, -0.14274978637695312, -0.1251678466796875, -0.10758590698242188, -0.09000396728515625, -0.07242202758789062, -0.054840087890625, -0.037258148193359375, -0.01967620849609375, -0.002094268798828125, 0.0154876708984375, 0.033069610595703125, 0.05065155029296875, 0.06823348999023438, 0.0858154296875, 0.10339736938476562, 0.12097930908203125, 0.13856124877929688, 0.1561431884765625, 0.17372512817382812, 0.19130706787109375, 0.20888900756835938, 0.226470947265625, 0.24405288696289062, 0.26163482666015625, 0.2792167663574219, 0.2967987060546875, 0.3143806457519531, 0.33196258544921875, 0.3495445251464844, 0.36712646484375, 0.3847084045410156, 0.40229034423828125, 0.4198722839355469, 0.4374542236328125, 0.4550361633300781, 0.47261810302734375, 0.4902000427246094, 0.507781982421875, 0.5253639221191406, 0.5429458618164062, 0.5605278015136719, 0.5781097412109375, 0.5956916809082031, 0.6132736206054688, 0.6308555603027344, 0.6484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 10.0, 8.0, 12.0, 32.0, 25.0, 59.0, 92.0, 187.0, 334.0, 659.0, 2046.0, 9882.0, 142499.0, 815237.0, 68274.0, 6363.0, 1599.0, 551.0, 277.0, 138.0, 98.0, 59.0, 28.0, 23.0, 10.0, 8.0, 9.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.7046661376953125, -0.676910400390625, -0.6491546630859375, -0.62139892578125, -0.5936431884765625, -0.565887451171875, -0.5381317138671875, -0.5103759765625, -0.4826202392578125, -0.454864501953125, -0.4271087646484375, -0.39935302734375, -0.3715972900390625, -0.343841552734375, -0.3160858154296875, -0.288330078125, -0.2605743408203125, -0.232818603515625, -0.2050628662109375, -0.17730712890625, -0.1495513916015625, -0.121795654296875, -0.0940399169921875, -0.0662841796875, -0.0385284423828125, -0.010772705078125, 0.0169830322265625, 0.04473876953125, 0.0724945068359375, 0.100250244140625, 0.1280059814453125, 0.15576171875, 0.1835174560546875, 0.211273193359375, 0.2390289306640625, 0.26678466796875, 0.2945404052734375, 0.322296142578125, 0.3500518798828125, 0.3778076171875, 0.4055633544921875, 0.433319091796875, 0.4610748291015625, 0.48883056640625, 0.5165863037109375, 0.544342041015625, 0.5720977783203125, 0.599853515625, 0.6276092529296875, 0.655364990234375, 0.6831207275390625, 0.71087646484375, 0.7386322021484375, 0.766387939453125, 0.7941436767578125, 0.8218994140625, 0.8496551513671875, 0.877410888671875, 0.9051666259765625, 0.93292236328125, 0.9606781005859375, 0.988433837890625, 1.0161895751953125, 1.0439453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 13.0, 13.0, 16.0, 38.0, 75.0, 194.0, 333.0, 180.0, 90.0, 29.0, 17.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00063323974609375, -0.0006211623549461365, -0.000609084963798523, -0.0005970075726509094, -0.0005849301815032959, -0.0005728527903556824, -0.0005607753992080688, -0.0005486980080604553, -0.0005366206169128418, -0.0005245432257652283, -0.0005124658346176147, -0.0005003884434700012, -0.0004883110523223877, -0.00047623366117477417, -0.00046415627002716064, -0.0004520788788795471, -0.0004400014877319336, -0.00042792409658432007, -0.00041584670543670654, -0.000403769314289093, -0.0003916919231414795, -0.00037961453199386597, -0.00036753714084625244, -0.0003554597496986389, -0.0003433823585510254, -0.00033130496740341187, -0.00031922757625579834, -0.0003071501851081848, -0.0002950727939605713, -0.00028299540281295776, -0.00027091801166534424, -0.0002588406205177307, -0.0002467632293701172, -0.00023468583822250366, -0.00022260844707489014, -0.0002105310559272766, -0.00019845366477966309, -0.00018637627363204956, -0.00017429888248443604, -0.0001622214913368225, -0.00015014410018920898, -0.00013806670904159546, -0.00012598931789398193, -0.00011391192674636841, -0.00010183453559875488, -8.975714445114136e-05, -7.767975330352783e-05, -6.56023621559143e-05, -5.352497100830078e-05, -4.1447579860687256e-05, -2.937018871307373e-05, -1.7292797565460205e-05, -5.21540641784668e-06, 6.861984729766846e-06, 1.893937587738037e-05, 3.1016767024993896e-05, 4.309415817260742e-05, 5.517154932022095e-05, 6.724894046783447e-05, 7.9326331615448e-05, 9.140372276306152e-05, 0.00010348111391067505, 0.00011555850505828857, 0.0001276358962059021, 0.00013971328735351562]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 7.0, 8.0, 14.0, 20.0, 31.0, 56.0, 80.0, 149.0, 295.0, 1002.0, 9550.0, 914717.0, 118698.0, 2842.0, 578.0, 221.0, 124.0, 63.0, 38.0, 26.0, 11.0, 8.0, 10.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.95703125, -1.9052276611328125, -1.853424072265625, -1.8016204833984375, -1.74981689453125, -1.6980133056640625, -1.646209716796875, -1.5944061279296875, -1.5426025390625, -1.4907989501953125, -1.438995361328125, -1.3871917724609375, -1.33538818359375, -1.2835845947265625, -1.231781005859375, -1.1799774169921875, -1.128173828125, -1.0763702392578125, -1.024566650390625, -0.9727630615234375, -0.92095947265625, -0.8691558837890625, -0.817352294921875, -0.7655487060546875, -0.7137451171875, -0.6619415283203125, -0.610137939453125, -0.5583343505859375, -0.50653076171875, -0.4547271728515625, -0.402923583984375, -0.3511199951171875, -0.29931640625, -0.2475128173828125, -0.195709228515625, -0.1439056396484375, -0.09210205078125, -0.0402984619140625, 0.011505126953125, 0.0633087158203125, 0.1151123046875, 0.1669158935546875, 0.218719482421875, 0.2705230712890625, 0.32232666015625, 0.3741302490234375, 0.425933837890625, 0.4777374267578125, 0.529541015625, 0.5813446044921875, 0.633148193359375, 0.6849517822265625, 0.73675537109375, 0.7885589599609375, 0.840362548828125, 0.8921661376953125, 0.9439697265625, 0.9957733154296875, 1.047576904296875, 1.0993804931640625, 1.15118408203125, 1.2029876708984375, 1.254791259765625, 1.3065948486328125, 1.3583984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 11.0, 19.0, 9.0, 20.0, 28.0, 65.0, 79.0, 100.0, 97.0, 109.0, 107.0, 100.0, 89.0, 48.0, 37.0, 17.0, 16.0, 16.0, 14.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.5599098205566406, -0.5441360473632812, -0.5283622741699219, -0.5125885009765625, -0.4968147277832031, -0.48104095458984375, -0.4652671813964844, -0.449493408203125, -0.4337196350097656, -0.41794586181640625, -0.4021720886230469, -0.3863983154296875, -0.3706245422363281, -0.35485076904296875, -0.3390769958496094, -0.32330322265625, -0.3075294494628906, -0.29175567626953125, -0.2759819030761719, -0.2602081298828125, -0.24443435668945312, -0.22866058349609375, -0.21288681030273438, -0.197113037109375, -0.18133926391601562, -0.16556549072265625, -0.14979171752929688, -0.1340179443359375, -0.11824417114257812, -0.10247039794921875, -0.08669662475585938, -0.0709228515625, -0.055149078369140625, -0.03937530517578125, -0.023601531982421875, -0.0078277587890625, 0.007946014404296875, 0.02371978759765625, 0.039493560791015625, 0.055267333984375, 0.07104110717773438, 0.08681488037109375, 0.10258865356445312, 0.1183624267578125, 0.13413619995117188, 0.14990997314453125, 0.16568374633789062, 0.18145751953125, 0.19723129272460938, 0.21300506591796875, 0.22877883911132812, 0.2445526123046875, 0.2603263854980469, 0.27610015869140625, 0.2918739318847656, 0.307647705078125, 0.3234214782714844, 0.33919525146484375, 0.3549690246582031, 0.3707427978515625, 0.3865165710449219, 0.40229034423828125, 0.4180641174316406, 0.433837890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 12.0, 21.0, 33.0, 67.0, 87.0, 143.0, 190.0, 162.0, 128.0, 64.0, 43.0, 24.0, 14.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.981949806213379, -7.737807750701904, -7.493666172027588, -7.249524116516113, -7.005382537841797, -6.761240482330322, -6.517098426818848, -6.272956848144531, -6.028814792633057, -5.784672737121582, -5.540531158447266, -5.296389102935791, -5.052247524261475, -4.80810546875, -4.563963890075684, -4.319821834564209, -4.075679779052734, -3.831537961959839, -3.5873961448669434, -3.3432540893554688, -3.0991122722625732, -2.8549704551696777, -2.6108286380767822, -2.3666868209838867, -2.1225452423095703, -1.8784034252166748, -1.6342614889144897, -1.3901196718215942, -1.1459777355194092, -0.9018359184265137, -0.6576941013336182, -0.4135521650314331, -0.16941022872924805, 0.07473163306713104, 0.31887349486351013, 0.563015341758728, 0.8071572184562683, 1.0512990951538086, 1.295440912246704, 1.5395828485488892, 1.7837246656417847, 2.0278666019439697, 2.2720084190368652, 2.5161502361297607, 2.7602920532226562, 3.004434108734131, 3.2485756874084473, 3.492717742919922, 3.7368595600128174, 3.981001377105713, 4.2251434326171875, 4.469285011291504, 4.7134270668029785, 4.957569122314453, 5.2017107009887695, 5.445852756500244, 5.6899943351745605, 5.934136390686035, 6.178277969360352, 6.422420024871826, 6.666561603546143, 6.910703659057617, 7.154845237731934, 7.398987293243408, 7.643129348754883]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 11.0, 8.0, 11.0, 14.0, 15.0, 13.0, 22.0, 26.0, 25.0, 36.0, 35.0, 47.0, 51.0, 42.0, 51.0, 52.0, 40.0, 51.0, 52.0, 53.0, 44.0, 40.0, 39.0, 35.0, 23.0, 24.0, 28.0, 24.0, 17.0, 14.0, 12.0, 11.0, 8.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9368813037872314, -2.835259437561035, -2.733637809753418, -2.6320159435272217, -2.5303940773010254, -2.428772449493408, -2.327150583267212, -2.2255287170410156, -2.1239070892333984, -2.022285223007202, -1.9206634759902954, -1.8190417289733887, -1.7174198627471924, -1.6157981157302856, -1.514176368713379, -1.4125545024871826, -1.3109326362609863, -1.2093108892440796, -1.1076890230178833, -1.0060672760009766, -0.904445469379425, -0.8028236627578735, -0.7012019157409668, -0.5995801091194153, -0.49795830249786377, -0.39633649587631226, -0.29471471905708313, -0.193092942237854, -0.09147113561630249, 0.010150671005249023, 0.11177241802215576, 0.21339422464370728, 0.3150162696838379, 0.4166380763053894, 0.5182598829269409, 0.6198816299438477, 0.7215034365653992, 0.8231252431869507, 0.9247469902038574, 1.0263688564300537, 1.1279906034469604, 1.2296123504638672, 1.3312342166900635, 1.4328559637069702, 1.534477710723877, 1.6360995769500732, 1.73772132396698, 1.8393430709838867, 1.940964937210083, 2.0425868034362793, 2.1442084312438965, 2.2458302974700928, 2.347452163696289, 2.4490737915039062, 2.5506956577301025, 2.652317523956299, 2.753939151763916, 2.8555610179901123, 2.9571826457977295, 3.058804512023926, 3.160426378250122, 3.2620482444763184, 3.3636698722839355, 3.465291738510132, 3.566913604736328]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 6.0, 6.0, 10.0, 10.0, 31.0, 26.0, 58.0, 63.0, 95.0, 158.0, 388.0, 959.0, 3720.0, 36620.0, 3913386.0, 225013.0, 10465.0, 1897.0, 631.0, 309.0, 143.0, 100.0, 60.0, 39.0, 23.0, 19.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.486724853515625, -2.40313720703125, -2.319549560546875, -2.2359619140625, -2.152374267578125, -2.06878662109375, -1.985198974609375, -1.901611328125, -1.818023681640625, -1.73443603515625, -1.650848388671875, -1.5672607421875, -1.483673095703125, -1.40008544921875, -1.316497802734375, -1.23291015625, -1.149322509765625, -1.06573486328125, -0.982147216796875, -0.8985595703125, -0.814971923828125, -0.73138427734375, -0.647796630859375, -0.564208984375, -0.480621337890625, -0.39703369140625, -0.313446044921875, -0.2298583984375, -0.146270751953125, -0.06268310546875, 0.020904541015625, 0.1044921875, 0.188079833984375, 0.27166748046875, 0.355255126953125, 0.4388427734375, 0.522430419921875, 0.60601806640625, 0.689605712890625, 0.773193359375, 0.856781005859375, 0.94036865234375, 1.023956298828125, 1.1075439453125, 1.191131591796875, 1.27471923828125, 1.358306884765625, 1.44189453125, 1.525482177734375, 1.60906982421875, 1.692657470703125, 1.7762451171875, 1.859832763671875, 1.94342041015625, 2.027008056640625, 2.110595703125, 2.194183349609375, 2.27777099609375, 2.361358642578125, 2.4449462890625, 2.528533935546875, 2.61212158203125, 2.695709228515625, 2.779296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 9.0, 12.0, 16.0, 26.0, 41.0, 53.0, 63.0, 73.0, 70.0, 82.0, 81.0, 82.0, 69.0, 77.0, 57.0, 38.0, 43.0, 36.0, 16.0, 16.0, 16.0, 6.0, 6.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275390625, -0.268463134765625, -0.26153564453125, -0.254608154296875, -0.2476806640625, -0.240753173828125, -0.23382568359375, -0.226898193359375, -0.219970703125, -0.213043212890625, -0.20611572265625, -0.199188232421875, -0.1922607421875, -0.185333251953125, -0.17840576171875, -0.171478271484375, -0.16455078125, -0.157623291015625, -0.15069580078125, -0.143768310546875, -0.1368408203125, -0.129913330078125, -0.12298583984375, -0.116058349609375, -0.109130859375, -0.102203369140625, -0.09527587890625, -0.088348388671875, -0.0814208984375, -0.074493408203125, -0.06756591796875, -0.060638427734375, -0.0537109375, -0.046783447265625, -0.03985595703125, -0.032928466796875, -0.0260009765625, -0.019073486328125, -0.01214599609375, -0.005218505859375, 0.001708984375, 0.008636474609375, 0.01556396484375, 0.022491455078125, 0.0294189453125, 0.036346435546875, 0.04327392578125, 0.050201416015625, 0.05712890625, 0.064056396484375, 0.07098388671875, 0.077911376953125, 0.0848388671875, 0.091766357421875, 0.09869384765625, 0.105621337890625, 0.112548828125, 0.119476318359375, 0.12640380859375, 0.133331298828125, 0.1402587890625, 0.147186279296875, 0.15411376953125, 0.161041259765625, 0.16796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 10.0, 12.0, 19.0, 29.0, 49.0, 89.0, 114.0, 228.0, 477.0, 1644.0, 12462.0, 2526764.0, 1638130.0, 11591.0, 1576.0, 550.0, 230.0, 136.0, 57.0, 36.0, 30.0, 22.0, 14.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.955413818359375, -2.86004638671875, -2.764678955078125, -2.6693115234375, -2.573944091796875, -2.47857666015625, -2.383209228515625, -2.287841796875, -2.192474365234375, -2.09710693359375, -2.001739501953125, -1.9063720703125, -1.811004638671875, -1.71563720703125, -1.620269775390625, -1.52490234375, -1.429534912109375, -1.33416748046875, -1.238800048828125, -1.1434326171875, -1.048065185546875, -0.95269775390625, -0.857330322265625, -0.761962890625, -0.666595458984375, -0.57122802734375, -0.475860595703125, -0.3804931640625, -0.285125732421875, -0.18975830078125, -0.094390869140625, 0.0009765625, 0.096343994140625, 0.19171142578125, 0.287078857421875, 0.3824462890625, 0.477813720703125, 0.57318115234375, 0.668548583984375, 0.763916015625, 0.859283447265625, 0.95465087890625, 1.050018310546875, 1.1453857421875, 1.240753173828125, 1.33612060546875, 1.431488037109375, 1.52685546875, 1.622222900390625, 1.71759033203125, 1.812957763671875, 1.9083251953125, 2.003692626953125, 2.09906005859375, 2.194427490234375, 2.289794921875, 2.385162353515625, 2.48052978515625, 2.575897216796875, 2.6712646484375, 2.766632080078125, 2.86199951171875, 2.957366943359375, 3.052734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 14.0, 17.0, 27.0, 48.0, 89.0, 164.0, 377.0, 1757.0, 1028.0, 265.0, 125.0, 69.0, 31.0, 20.0, 9.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.44140625, -0.4229278564453125, -0.404449462890625, -0.3859710693359375, -0.36749267578125, -0.3490142822265625, -0.330535888671875, -0.3120574951171875, -0.2935791015625, -0.2751007080078125, -0.256622314453125, -0.2381439208984375, -0.21966552734375, -0.2011871337890625, -0.182708740234375, -0.1642303466796875, -0.145751953125, -0.1272735595703125, -0.108795166015625, -0.0903167724609375, -0.07183837890625, -0.0533599853515625, -0.034881591796875, -0.0164031982421875, 0.0020751953125, 0.0205535888671875, 0.039031982421875, 0.0575103759765625, 0.07598876953125, 0.0944671630859375, 0.112945556640625, 0.1314239501953125, 0.14990234375, 0.1683807373046875, 0.186859130859375, 0.2053375244140625, 0.22381591796875, 0.2422943115234375, 0.260772705078125, 0.2792510986328125, 0.2977294921875, 0.3162078857421875, 0.334686279296875, 0.3531646728515625, 0.37164306640625, 0.3901214599609375, 0.408599853515625, 0.4270782470703125, 0.445556640625, 0.4640350341796875, 0.482513427734375, 0.5009918212890625, 0.51947021484375, 0.5379486083984375, 0.556427001953125, 0.5749053955078125, 0.5933837890625, 0.6118621826171875, 0.630340576171875, 0.6488189697265625, 0.66729736328125, 0.6857757568359375, 0.704254150390625, 0.7227325439453125, 0.7412109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 16.0, 56.0, 105.0, 218.0, 298.0, 182.0, 77.0, 19.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7136688232421875, -7.544812202453613, -7.375955581665039, -7.207098960876465, -7.038242340087891, -6.869385719299316, -6.700529098510742, -6.53167200088501, -6.3628153800964355, -6.193958759307861, -6.025102138519287, -5.856245517730713, -5.687388896942139, -5.518531799316406, -5.349675178527832, -5.180818557739258, -5.011961936950684, -4.843105316162109, -4.674248695373535, -4.505392074584961, -4.336535453796387, -4.1676788330078125, -3.998821973800659, -3.829965114593506, -3.66110897064209, -3.4922523498535156, -3.3233957290649414, -3.154539108276367, -2.985682249069214, -2.8168256282806396, -2.6479690074920654, -2.479112148284912, -2.310255527496338, -2.1413989067077637, -1.9725421667099, -1.8036855459213257, -1.634828805923462, -1.4659721851348877, -1.2971155643463135, -1.1282588243484497, -0.9594022035598755, -0.7905455231666565, -0.6216888427734375, -0.4528322219848633, -0.2839755415916443, -0.11511886119842529, 0.053737759590148926, 0.2225944995880127, 0.3914511203765869, 0.5603078007698059, 0.7291644811630249, 0.8980211019515991, 1.066877841949463, 1.235734462738037, 1.4045910835266113, 1.573447823524475, 1.7423044443130493, 1.9111610651016235, 2.0800178050994873, 2.2488744258880615, 2.4177310466766357, 2.586587905883789, 2.7554445266723633, 2.9243011474609375, 3.0931577682495117]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 5.0, 8.0, 9.0, 10.0, 15.0, 17.0, 14.0, 25.0, 28.0, 30.0, 36.0, 43.0, 48.0, 60.0, 61.0, 54.0, 62.0, 54.0, 56.0, 60.0, 63.0, 50.0, 41.0, 34.0, 20.0, 23.0, 20.0, 18.0, 7.0, 10.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6444146633148193, -1.5893096923828125, -1.5342048406600952, -1.4790998697280884, -1.423995018005371, -1.3688900470733643, -1.3137850761413574, -1.2586801052093506, -1.2035752534866333, -1.1484702825546265, -1.0933654308319092, -1.0382604598999023, -0.9831555485725403, -0.9280506372451782, -0.8729456663131714, -0.8178407549858093, -0.7627358436584473, -0.7076309323310852, -0.6525260210037231, -0.5974210500717163, -0.5423161387443542, -0.4872112274169922, -0.43210628628730774, -0.3770013451576233, -0.32189643383026123, -0.26679152250289917, -0.21168658137321472, -0.15658165514469147, -0.10147672891616821, -0.04637181758880615, 0.008733123540878296, 0.06383806467056274, 0.1189429759979248, 0.17404790222644806, 0.2291528284549713, 0.28425776958465576, 0.3393626809120178, 0.3944675922393799, 0.44957253336906433, 0.5046774744987488, 0.5597823858261108, 0.6148872971534729, 0.669992208480835, 0.7250971794128418, 0.7802020907402039, 0.8353070020675659, 0.8904119729995728, 0.9455168843269348, 1.0006217956542969, 1.0557267665863037, 1.110831618309021, 1.1659365892410278, 1.2210414409637451, 1.276146411895752, 1.3312513828277588, 1.3863563537597656, 1.441461205482483, 1.4965661764144897, 1.551671028137207, 1.6067759990692139, 1.6618809700012207, 1.716985821723938, 1.7720907926559448, 1.827195644378662, 1.882300615310669]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 13.0, 3.0, 7.0, 14.0, 14.0, 22.0, 22.0, 31.0, 48.0, 92.0, 131.0, 207.0, 441.0, 1009.0, 3575.0, 21835.0, 329025.0, 633819.0, 49643.0, 5835.0, 1488.0, 597.0, 243.0, 152.0, 89.0, 56.0, 37.0, 27.0, 23.0, 18.0, 8.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.6923828125, -1.6343536376953125, -1.576324462890625, -1.5182952880859375, -1.46026611328125, -1.4022369384765625, -1.344207763671875, -1.2861785888671875, -1.2281494140625, -1.1701202392578125, -1.112091064453125, -1.0540618896484375, -0.99603271484375, -0.9380035400390625, -0.879974365234375, -0.8219451904296875, -0.763916015625, -0.7058868408203125, -0.647857666015625, -0.5898284912109375, -0.53179931640625, -0.4737701416015625, -0.415740966796875, -0.3577117919921875, -0.2996826171875, -0.2416534423828125, -0.183624267578125, -0.1255950927734375, -0.06756591796875, -0.0095367431640625, 0.048492431640625, 0.1065216064453125, 0.16455078125, 0.2225799560546875, 0.280609130859375, 0.3386383056640625, 0.39666748046875, 0.4546966552734375, 0.512725830078125, 0.5707550048828125, 0.6287841796875, 0.6868133544921875, 0.744842529296875, 0.8028717041015625, 0.86090087890625, 0.9189300537109375, 0.976959228515625, 1.0349884033203125, 1.093017578125, 1.1510467529296875, 1.209075927734375, 1.2671051025390625, 1.32513427734375, 1.3831634521484375, 1.441192626953125, 1.4992218017578125, 1.5572509765625, 1.6152801513671875, 1.673309326171875, 1.7313385009765625, 1.78936767578125, 1.8473968505859375, 1.905426025390625, 1.9634552001953125, 2.021484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 16.0, 12.0, 18.0, 27.0, 34.0, 34.0, 45.0, 51.0, 66.0, 70.0, 66.0, 71.0, 67.0, 73.0, 58.0, 51.0, 49.0, 35.0, 29.0, 36.0, 23.0, 14.0, 13.0, 12.0, 8.0, 2.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.270751953125, -0.26425933837890625, -0.2577667236328125, -0.25127410888671875, -0.244781494140625, -0.23828887939453125, -0.2317962646484375, -0.22530364990234375, -0.21881103515625, -0.21231842041015625, -0.2058258056640625, -0.19933319091796875, -0.192840576171875, -0.18634796142578125, -0.1798553466796875, -0.17336273193359375, -0.1668701171875, -0.16037750244140625, -0.1538848876953125, -0.14739227294921875, -0.140899658203125, -0.13440704345703125, -0.1279144287109375, -0.12142181396484375, -0.11492919921875, -0.10843658447265625, -0.1019439697265625, -0.09545135498046875, -0.088958740234375, -0.08246612548828125, -0.0759735107421875, -0.06948089599609375, -0.06298828125, -0.05649566650390625, -0.0500030517578125, -0.04351043701171875, -0.037017822265625, -0.03052520751953125, -0.0240325927734375, -0.01753997802734375, -0.01104736328125, -0.00455474853515625, 0.0019378662109375, 0.00843048095703125, 0.014923095703125, 0.02141571044921875, 0.0279083251953125, 0.03440093994140625, 0.0408935546875, 0.04738616943359375, 0.0538787841796875, 0.06037139892578125, 0.066864013671875, 0.07335662841796875, 0.0798492431640625, 0.08634185791015625, 0.09283447265625, 0.09932708740234375, 0.1058197021484375, 0.11231231689453125, 0.118804931640625, 0.12529754638671875, 0.1317901611328125, 0.13828277587890625, 0.144775390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 12.0, 23.0, 9.0, 24.0, 37.0, 48.0, 51.0, 100.0, 209.0, 419.0, 1239.0, 3881.0, 16084.0, 80325.0, 368982.0, 441297.0, 107432.0, 20841.0, 4962.0, 1468.0, 518.0, 222.0, 113.0, 80.0, 36.0, 34.0, 28.0, 13.0, 15.0, 13.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0], "bins": [-1.0595703125, -1.0324630737304688, -1.0053558349609375, -0.9782485961914062, -0.951141357421875, -0.9240341186523438, -0.8969268798828125, -0.8698196411132812, -0.84271240234375, -0.8156051635742188, -0.7884979248046875, -0.7613906860351562, -0.734283447265625, -0.7071762084960938, -0.6800689697265625, -0.6529617309570312, -0.6258544921875, -0.5987472534179688, -0.5716400146484375, -0.5445327758789062, -0.517425537109375, -0.49031829833984375, -0.4632110595703125, -0.43610382080078125, -0.40899658203125, -0.38188934326171875, -0.3547821044921875, -0.32767486572265625, -0.300567626953125, -0.27346038818359375, -0.2463531494140625, -0.21924591064453125, -0.192138671875, -0.16503143310546875, -0.1379241943359375, -0.11081695556640625, -0.083709716796875, -0.05660247802734375, -0.0294952392578125, -0.00238800048828125, 0.02471923828125, 0.05182647705078125, 0.0789337158203125, 0.10604095458984375, 0.133148193359375, 0.16025543212890625, 0.1873626708984375, 0.21446990966796875, 0.2415771484375, 0.26868438720703125, 0.2957916259765625, 0.32289886474609375, 0.350006103515625, 0.37711334228515625, 0.4042205810546875, 0.43132781982421875, 0.45843505859375, 0.48554229736328125, 0.5126495361328125, 0.5397567749023438, 0.566864013671875, 0.5939712524414062, 0.6210784912109375, 0.6481857299804688, 0.67529296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 12.0, 12.0, 11.0, 15.0, 19.0, 19.0, 21.0, 35.0, 40.0, 42.0, 51.0, 56.0, 66.0, 68.0, 57.0, 50.0, 72.0, 66.0, 51.0, 52.0, 34.0, 29.0, 35.0, 17.0, 24.0, 12.0, 7.0, 7.0, 9.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0595703125, -1.03350830078125, -1.0074462890625, -0.98138427734375, -0.955322265625, -0.92926025390625, -0.9031982421875, -0.87713623046875, -0.85107421875, -0.82501220703125, -0.7989501953125, -0.77288818359375, -0.746826171875, -0.72076416015625, -0.6947021484375, -0.66864013671875, -0.642578125, -0.61651611328125, -0.5904541015625, -0.56439208984375, -0.538330078125, -0.51226806640625, -0.4862060546875, -0.46014404296875, -0.43408203125, -0.40802001953125, -0.3819580078125, -0.35589599609375, -0.329833984375, -0.30377197265625, -0.2777099609375, -0.25164794921875, -0.2255859375, -0.19952392578125, -0.1734619140625, -0.14739990234375, -0.121337890625, -0.09527587890625, -0.0692138671875, -0.04315185546875, -0.01708984375, 0.00897216796875, 0.0350341796875, 0.06109619140625, 0.087158203125, 0.11322021484375, 0.1392822265625, 0.16534423828125, 0.19140625, 0.21746826171875, 0.2435302734375, 0.26959228515625, 0.295654296875, 0.32171630859375, 0.3477783203125, 0.37384033203125, 0.39990234375, 0.42596435546875, 0.4520263671875, 0.47808837890625, 0.504150390625, 0.53021240234375, 0.5562744140625, 0.58233642578125, 0.6083984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 10.0, 9.0, 15.0, 13.0, 23.0, 33.0, 44.0, 72.0, 125.0, 231.0, 521.0, 1740.0, 7855.0, 68324.0, 552323.0, 373617.0, 36398.0, 4912.0, 1323.0, 440.0, 183.0, 104.0, 60.0, 54.0, 41.0, 23.0, 14.0, 14.0, 9.0, 6.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.533203125, -0.51593017578125, -0.4986572265625, -0.48138427734375, -0.464111328125, -0.44683837890625, -0.4295654296875, -0.41229248046875, -0.39501953125, -0.37774658203125, -0.3604736328125, -0.34320068359375, -0.325927734375, -0.30865478515625, -0.2913818359375, -0.27410888671875, -0.2568359375, -0.23956298828125, -0.2222900390625, -0.20501708984375, -0.187744140625, -0.17047119140625, -0.1531982421875, -0.13592529296875, -0.11865234375, -0.10137939453125, -0.0841064453125, -0.06683349609375, -0.049560546875, -0.03228759765625, -0.0150146484375, 0.00225830078125, 0.01953125, 0.03680419921875, 0.0540771484375, 0.07135009765625, 0.088623046875, 0.10589599609375, 0.1231689453125, 0.14044189453125, 0.15771484375, 0.17498779296875, 0.1922607421875, 0.20953369140625, 0.226806640625, 0.24407958984375, 0.2613525390625, 0.27862548828125, 0.2958984375, 0.31317138671875, 0.3304443359375, 0.34771728515625, 0.364990234375, 0.38226318359375, 0.3995361328125, 0.41680908203125, 0.43408203125, 0.45135498046875, 0.4686279296875, 0.48590087890625, 0.503173828125, 0.52044677734375, 0.5377197265625, 0.55499267578125, 0.572265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 8.0, 14.0, 17.0, 21.0, 48.0, 74.0, 90.0, 141.0, 151.0, 136.0, 111.0, 72.0, 44.0, 23.0, 22.0, 16.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.0001881122589111328, -0.00018424354493618011, -0.00018037483096122742, -0.00017650611698627472, -0.00017263740301132202, -0.00016876868903636932, -0.00016489997506141663, -0.00016103126108646393, -0.00015716254711151123, -0.00015329383313655853, -0.00014942511916160583, -0.00014555640518665314, -0.00014168769121170044, -0.00013781897723674774, -0.00013395026326179504, -0.00013008154928684235, -0.00012621283531188965, -0.00012234412133693695, -0.00011847540736198425, -0.00011460669338703156, -0.00011073797941207886, -0.00010686926543712616, -0.00010300055146217346, -9.913183748722076e-05, -9.526312351226807e-05, -9.139440953731537e-05, -8.752569556236267e-05, -8.365698158740997e-05, -7.978826761245728e-05, -7.591955363750458e-05, -7.205083966255188e-05, -6.818212568759918e-05, -6.431341171264648e-05, -6.044469773769379e-05, -5.657598376274109e-05, -5.270726978778839e-05, -4.883855581283569e-05, -4.4969841837882996e-05, -4.11011278629303e-05, -3.72324138879776e-05, -3.33636999130249e-05, -2.9494985938072205e-05, -2.5626271963119507e-05, -2.175755798816681e-05, -1.788884401321411e-05, -1.4020130038261414e-05, -1.0151416063308716e-05, -6.282702088356018e-06, -2.4139881134033203e-06, 1.4547258615493774e-06, 5.323439836502075e-06, 9.192153811454773e-06, 1.306086778640747e-05, 1.692958176136017e-05, 2.0798295736312866e-05, 2.4667009711265564e-05, 2.8535723686218262e-05, 3.240443766117096e-05, 3.627315163612366e-05, 4.0141865611076355e-05, 4.401057958602905e-05, 4.787929356098175e-05, 5.174800753593445e-05, 5.5616721510887146e-05, 5.9485435485839844e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 14.0, 29.0, 35.0, 72.0, 134.0, 260.0, 696.0, 2208.0, 13769.0, 380423.0, 620703.0, 25742.0, 2989.0, 838.0, 319.0, 144.0, 61.0, 36.0, 25.0, 16.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.59765625, -0.5738525390625, -0.550048828125, -0.5262451171875, -0.50244140625, -0.4786376953125, -0.454833984375, -0.4310302734375, -0.4072265625, -0.3834228515625, -0.359619140625, -0.3358154296875, -0.31201171875, -0.2882080078125, -0.264404296875, -0.2406005859375, -0.216796875, -0.1929931640625, -0.169189453125, -0.1453857421875, -0.12158203125, -0.0977783203125, -0.073974609375, -0.0501708984375, -0.0263671875, -0.0025634765625, 0.021240234375, 0.0450439453125, 0.06884765625, 0.0926513671875, 0.116455078125, 0.1402587890625, 0.1640625, 0.1878662109375, 0.211669921875, 0.2354736328125, 0.25927734375, 0.2830810546875, 0.306884765625, 0.3306884765625, 0.3544921875, 0.3782958984375, 0.402099609375, 0.4259033203125, 0.44970703125, 0.4735107421875, 0.497314453125, 0.5211181640625, 0.544921875, 0.5687255859375, 0.592529296875, 0.6163330078125, 0.64013671875, 0.6639404296875, 0.687744140625, 0.7115478515625, 0.7353515625, 0.7591552734375, 0.782958984375, 0.8067626953125, 0.83056640625, 0.8543701171875, 0.878173828125, 0.9019775390625, 0.92578125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 5.0, 17.0, 21.0, 36.0, 30.0, 50.0, 66.0, 82.0, 87.0, 90.0, 116.0, 86.0, 80.0, 51.0, 49.0, 34.0, 30.0, 21.0, 12.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3115234375, -0.2994384765625, -0.287353515625, -0.2752685546875, -0.26318359375, -0.2510986328125, -0.239013671875, -0.2269287109375, -0.21484375, -0.2027587890625, -0.190673828125, -0.1785888671875, -0.16650390625, -0.1544189453125, -0.142333984375, -0.1302490234375, -0.1181640625, -0.1060791015625, -0.093994140625, -0.0819091796875, -0.06982421875, -0.0577392578125, -0.045654296875, -0.0335693359375, -0.021484375, -0.0093994140625, 0.002685546875, 0.0147705078125, 0.02685546875, 0.0389404296875, 0.051025390625, 0.0631103515625, 0.0751953125, 0.0872802734375, 0.099365234375, 0.1114501953125, 0.12353515625, 0.1356201171875, 0.147705078125, 0.1597900390625, 0.171875, 0.1839599609375, 0.196044921875, 0.2081298828125, 0.22021484375, 0.2322998046875, 0.244384765625, 0.2564697265625, 0.2685546875, 0.2806396484375, 0.292724609375, 0.3048095703125, 0.31689453125, 0.3289794921875, 0.341064453125, 0.3531494140625, 0.365234375, 0.3773193359375, 0.389404296875, 0.4014892578125, 0.41357421875, 0.4256591796875, 0.437744140625, 0.4498291015625, 0.4619140625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 17.0, 38.0, 98.0, 195.0, 307.0, 183.0, 110.0, 40.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.664787292480469, -9.301289558410645, -8.937792778015137, -8.574295043945312, -8.210797309875488, -7.847300052642822, -7.483802795410156, -7.120305061340332, -6.756807804107666, -6.393310546875, -6.029812812805176, -5.66631555557251, -5.302818298339844, -4.9393205642700195, -4.5758233070373535, -4.2123260498046875, -3.8488283157348633, -3.485330820083618, -3.121833324432373, -2.758336067199707, -2.394838571548462, -2.031341075897217, -1.6678438186645508, -1.3043463230133057, -0.9408488273620605, -0.5773513913154602, -0.21385395526885986, 0.1496434211730957, 0.5131409168243408, 0.8766384124755859, 1.240135669708252, 1.603633165359497, 1.9671306610107422, 2.3306281566619873, 2.6941256523132324, 3.0576229095458984, 3.4211204051971436, 3.7846179008483887, 4.148115158081055, 4.511612892150879, 4.875110149383545, 5.238607406616211, 5.602105140686035, 5.965602397918701, 6.329099655151367, 6.692597389221191, 7.056094646453857, 7.419591903686523, 7.783089637756348, 8.146587371826172, 8.51008415222168, 8.873581886291504, 9.237079620361328, 9.600576400756836, 9.96407413482666, 10.327571868896484, 10.691068649291992, 11.054566383361816, 11.418063163757324, 11.781560897827148, 12.145058631896973, 12.508556365966797, 12.872053146362305, 13.235550880432129, 13.599048614501953]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 4.0, 13.0, 5.0, 8.0, 17.0, 14.0, 16.0, 24.0, 17.0, 27.0, 25.0, 31.0, 26.0, 25.0, 27.0, 32.0, 29.0, 39.0, 31.0, 36.0, 50.0, 39.0, 26.0, 30.0, 53.0, 36.0, 35.0, 25.0, 33.0, 24.0, 27.0, 18.0, 23.0, 22.0, 15.0, 17.0, 16.0, 10.0, 8.0, 10.0, 3.0, 7.0, 2.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.555950164794922, -2.475146770477295, -2.394343376159668, -2.313539743423462, -2.232736349105835, -2.151932954788208, -2.071129560470581, -1.990326166152954, -1.9095226526260376, -1.8287192583084106, -1.7479157447814941, -1.6671123504638672, -1.5863089561462402, -1.5055054426193237, -1.4247020483016968, -1.3438985347747803, -1.2630951404571533, -1.1822917461395264, -1.1014882326126099, -1.020684838294983, -0.9398813843727112, -0.8590779304504395, -0.7782745361328125, -0.6974710822105408, -0.616667628288269, -0.5358641743659973, -0.455060750246048, -0.37425732612609863, -0.2934538722038269, -0.21265041828155518, -0.13184699416160583, -0.051043570041656494, 0.029759883880615234, 0.11056332290172577, 0.1913667619228363, 0.27217018604278564, 0.3529736399650574, 0.4337770938873291, 0.514580488204956, 0.5953839421272278, 0.6761873960494995, 0.7569908499717712, 0.837794303894043, 0.9185976982116699, 0.9994011521339417, 1.0802046060562134, 1.1610080003738403, 1.2418115139007568, 1.3226149082183838, 1.4034183025360107, 1.4842218160629272, 1.5650252103805542, 1.6458287239074707, 1.7266321182250977, 1.8074355125427246, 1.8882389068603516, 1.969042420387268, 2.0498459339141846, 2.1306493282318115, 2.2114527225494385, 2.2922561168670654, 2.3730597496032715, 2.4538631439208984, 2.5346665382385254, 2.6154699325561523]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 7.0, 8.0, 10.0, 12.0, 23.0, 28.0, 31.0, 50.0, 84.0, 129.0, 246.0, 519.0, 1502.0, 6358.0, 51297.0, 3955624.0, 162089.0, 12086.0, 2387.0, 897.0, 342.0, 209.0, 104.0, 72.0, 59.0, 21.0, 17.0, 20.0, 19.0, 6.0, 1.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.714019775390625, -1.63116455078125, -1.548309326171875, -1.4654541015625, -1.382598876953125, -1.29974365234375, -1.216888427734375, -1.134033203125, -1.051177978515625, -0.96832275390625, -0.885467529296875, -0.8026123046875, -0.719757080078125, -0.63690185546875, -0.554046630859375, -0.47119140625, -0.388336181640625, -0.30548095703125, -0.222625732421875, -0.1397705078125, -0.056915283203125, 0.02593994140625, 0.108795166015625, 0.191650390625, 0.274505615234375, 0.35736083984375, 0.440216064453125, 0.5230712890625, 0.605926513671875, 0.68878173828125, 0.771636962890625, 0.8544921875, 0.937347412109375, 1.02020263671875, 1.103057861328125, 1.1859130859375, 1.268768310546875, 1.35162353515625, 1.434478759765625, 1.517333984375, 1.600189208984375, 1.68304443359375, 1.765899658203125, 1.8487548828125, 1.931610107421875, 2.01446533203125, 2.097320556640625, 2.18017578125, 2.263031005859375, 2.34588623046875, 2.428741455078125, 2.5115966796875, 2.594451904296875, 2.67730712890625, 2.760162353515625, 2.843017578125, 2.925872802734375, 3.00872802734375, 3.091583251953125, 3.1744384765625, 3.257293701171875, 3.34014892578125, 3.423004150390625, 3.505859375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 7.0, 8.0, 7.0, 16.0, 22.0, 21.0, 27.0, 25.0, 49.0, 48.0, 57.0, 58.0, 57.0, 72.0, 71.0, 67.0, 63.0, 55.0, 44.0, 42.0, 41.0, 40.0, 26.0, 16.0, 19.0, 11.0, 10.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.2508506774902344, -0.24413299560546875, -0.23741531372070312, -0.2306976318359375, -0.22397994995117188, -0.21726226806640625, -0.21054458618164062, -0.203826904296875, -0.19710922241210938, -0.19039154052734375, -0.18367385864257812, -0.1769561767578125, -0.17023849487304688, -0.16352081298828125, -0.15680313110351562, -0.15008544921875, -0.14336776733398438, -0.13665008544921875, -0.12993240356445312, -0.1232147216796875, -0.11649703979492188, -0.10977935791015625, -0.10306167602539062, -0.096343994140625, -0.08962631225585938, -0.08290863037109375, -0.07619094848632812, -0.0694732666015625, -0.06275558471679688, -0.05603790283203125, -0.049320220947265625, -0.0426025390625, -0.035884857177734375, -0.02916717529296875, -0.022449493408203125, -0.0157318115234375, -0.009014129638671875, -0.00229644775390625, 0.004421234130859375, 0.011138916015625, 0.017856597900390625, 0.02457427978515625, 0.031291961669921875, 0.0380096435546875, 0.044727325439453125, 0.05144500732421875, 0.058162689208984375, 0.06488037109375, 0.07159805297851562, 0.07831573486328125, 0.08503341674804688, 0.0917510986328125, 0.09846878051757812, 0.10518646240234375, 0.11190414428710938, 0.118621826171875, 0.12533950805664062, 0.13205718994140625, 0.13877487182617188, 0.1454925537109375, 0.15221023559570312, 0.15892791748046875, 0.16564559936523438, 0.17236328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 7.0, 4.0, 4.0, 8.0, 6.0, 11.0, 20.0, 21.0, 30.0, 46.0, 58.0, 96.0, 149.0, 236.0, 436.0, 866.0, 1884.0, 4965.0, 17088.0, 88733.0, 3479543.0, 535310.0, 47397.0, 10815.0, 3540.0, 1446.0, 666.0, 329.0, 172.0, 109.0, 68.0, 63.0, 36.0, 26.0, 17.0, 17.0, 11.0, 5.0, 10.0, 8.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.2812652587890625, -1.238311767578125, -1.1953582763671875, -1.15240478515625, -1.1094512939453125, -1.066497802734375, -1.0235443115234375, -0.9805908203125, -0.9376373291015625, -0.894683837890625, -0.8517303466796875, -0.80877685546875, -0.7658233642578125, -0.722869873046875, -0.6799163818359375, -0.636962890625, -0.5940093994140625, -0.551055908203125, -0.5081024169921875, -0.46514892578125, -0.4221954345703125, -0.379241943359375, -0.3362884521484375, -0.2933349609375, -0.2503814697265625, -0.207427978515625, -0.1644744873046875, -0.12152099609375, -0.0785675048828125, -0.035614013671875, 0.0073394775390625, 0.05029296875, 0.0932464599609375, 0.136199951171875, 0.1791534423828125, 0.22210693359375, 0.2650604248046875, 0.308013916015625, 0.3509674072265625, 0.3939208984375, 0.4368743896484375, 0.479827880859375, 0.5227813720703125, 0.56573486328125, 0.6086883544921875, 0.651641845703125, 0.6945953369140625, 0.737548828125, 0.7805023193359375, 0.823455810546875, 0.8664093017578125, 0.90936279296875, 0.9523162841796875, 0.995269775390625, 1.0382232666015625, 1.0811767578125, 1.1241302490234375, 1.167083740234375, 1.2100372314453125, 1.25299072265625, 1.2959442138671875, 1.338897705078125, 1.3818511962890625, 1.4248046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 3.0, 13.0, 21.0, 23.0, 51.0, 79.0, 126.0, 263.0, 1483.0, 1294.0, 293.0, 130.0, 90.0, 49.0, 44.0, 29.0, 15.0, 23.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.64794921875, -0.633544921875, -0.619140625, -0.604736328125, -0.59033203125, -0.575927734375, -0.5615234375, -0.547119140625, -0.53271484375, -0.518310546875, -0.50390625, -0.489501953125, -0.47509765625, -0.460693359375, -0.4462890625, -0.431884765625, -0.41748046875, -0.403076171875, -0.388671875, -0.374267578125, -0.35986328125, -0.345458984375, -0.3310546875, -0.316650390625, -0.30224609375, -0.287841796875, -0.2734375, -0.259033203125, -0.24462890625, -0.230224609375, -0.2158203125, -0.201416015625, -0.18701171875, -0.172607421875, -0.158203125, -0.143798828125, -0.12939453125, -0.114990234375, -0.1005859375, -0.086181640625, -0.07177734375, -0.057373046875, -0.04296875, -0.028564453125, -0.01416015625, 0.000244140625, 0.0146484375, 0.029052734375, 0.04345703125, 0.057861328125, 0.072265625, 0.086669921875, 0.10107421875, 0.115478515625, 0.1298828125, 0.144287109375, 0.15869140625, 0.173095703125, 0.1875, 0.201904296875, 0.21630859375, 0.230712890625, 0.2451171875, 0.259521484375, 0.27392578125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 55.0, 205.0, 406.0, 243.0, 65.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.044795513153076, -6.840387344360352, -6.635979175567627, -6.431571006774902, -6.2271623611450195, -6.022754192352295, -5.81834602355957, -5.613937854766846, -5.409529685974121, -5.2051215171813965, -5.000713348388672, -4.796304702758789, -4.5918965339660645, -4.38748836517334, -4.183080196380615, -3.9786720275878906, -3.774263381958008, -3.569855213165283, -3.3654468059539795, -3.161038637161255, -2.956630229949951, -2.7522220611572266, -2.547813892364502, -2.3434057235717773, -2.1389973163604736, -1.9345890283584595, -1.7301807403564453, -1.5257725715637207, -1.3213642835617065, -1.1169559955596924, -0.9125478267669678, -0.7081395387649536, -0.5037307739257812, -0.2993225157260895, -0.0949142575263977, 0.10949397087097168, 0.31390225887298584, 0.518310546875, 0.7227187156677246, 0.9271270036697388, 1.131535291671753, 1.335943579673767, 1.5403518676757812, 1.7447600364685059, 1.94916832447052, 2.153576612472534, 2.357984781265259, 2.5623931884765625, 2.766801357269287, 2.9712095260620117, 3.1756179332733154, 3.38002610206604, 3.5844345092773438, 3.7888426780700684, 3.993250846862793, 4.197659015655518, 4.402067184448242, 4.606475353240967, 4.810883522033691, 5.015292167663574, 5.219700336456299, 5.424108505249023, 5.628516674041748, 5.832924842834473, 6.0373334884643555]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 5.0, 12.0, 15.0, 18.0, 18.0, 23.0, 27.0, 35.0, 41.0, 57.0, 51.0, 46.0, 64.0, 52.0, 59.0, 52.0, 60.0, 56.0, 42.0, 63.0, 37.0, 34.0, 28.0, 27.0, 20.0, 12.0, 7.0, 12.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.8850996494293213, -1.8407809734344482, -1.7964622974395752, -1.7521436214447021, -1.707824945449829, -1.6635061502456665, -1.6191874742507935, -1.5748687982559204, -1.5305501222610474, -1.4862314462661743, -1.4419127702713013, -1.3975940942764282, -1.3532752990722656, -1.3089566230773926, -1.2646379470825195, -1.2203192710876465, -1.1760005950927734, -1.1316819190979004, -1.0873632431030273, -1.0430445671081543, -0.9987258315086365, -0.9544071555137634, -0.9100884199142456, -0.8657697439193726, -0.8214510679244995, -0.7771323919296265, -0.7328137159347534, -0.6884949803352356, -0.6441763043403625, -0.5998576283454895, -0.5555388927459717, -0.5112202167510986, -0.46690165996551514, -0.4225829839706421, -0.37826427817344666, -0.3339455723762512, -0.2896268963813782, -0.24530820548534393, -0.2009895145893097, -0.15667080879211426, -0.11235213279724121, -0.06803344190120697, -0.02371475100517273, 0.02060393989086151, 0.06492263078689575, 0.10924132168292999, 0.15356001257896423, 0.19787871837615967, 0.24219739437103271, 0.28651607036590576, 0.3308347761631012, 0.37515348196029663, 0.4194721579551697, 0.4637908339500427, 0.5081095695495605, 0.5524282455444336, 0.5967469215393066, 0.6410655975341797, 0.6853842735290527, 0.7297030091285706, 0.7740216851234436, 0.8183403611183167, 0.8626590967178345, 0.9069777727127075, 0.9512964487075806]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 10.0, 4.0, 4.0, 10.0, 17.0, 17.0, 30.0, 41.0, 64.0, 122.0, 198.0, 361.0, 811.0, 2608.0, 13573.0, 167036.0, 728369.0, 120701.0, 10729.0, 2232.0, 769.0, 344.0, 193.0, 105.0, 63.0, 42.0, 34.0, 18.0, 12.0, 16.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.80859375, -1.747161865234375, -1.68572998046875, -1.624298095703125, -1.5628662109375, -1.501434326171875, -1.44000244140625, -1.378570556640625, -1.317138671875, -1.255706787109375, -1.19427490234375, -1.132843017578125, -1.0714111328125, -1.009979248046875, -0.94854736328125, -0.887115478515625, -0.82568359375, -0.764251708984375, -0.70281982421875, -0.641387939453125, -0.5799560546875, -0.518524169921875, -0.45709228515625, -0.395660400390625, -0.334228515625, -0.272796630859375, -0.21136474609375, -0.149932861328125, -0.0885009765625, -0.027069091796875, 0.03436279296875, 0.095794677734375, 0.1572265625, 0.218658447265625, 0.28009033203125, 0.341522216796875, 0.4029541015625, 0.464385986328125, 0.52581787109375, 0.587249755859375, 0.648681640625, 0.710113525390625, 0.77154541015625, 0.832977294921875, 0.8944091796875, 0.955841064453125, 1.01727294921875, 1.078704833984375, 1.14013671875, 1.201568603515625, 1.26300048828125, 1.324432373046875, 1.3858642578125, 1.447296142578125, 1.50872802734375, 1.570159912109375, 1.631591796875, 1.693023681640625, 1.75445556640625, 1.815887451171875, 1.8773193359375, 1.938751220703125, 2.00018310546875, 2.061614990234375, 2.123046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 11.0, 19.0, 21.0, 14.0, 35.0, 48.0, 42.0, 56.0, 47.0, 54.0, 62.0, 61.0, 70.0, 59.0, 77.0, 60.0, 46.0, 37.0, 37.0, 23.0, 29.0, 13.0, 19.0, 13.0, 11.0, 9.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2744140625, -0.2673912048339844, -0.26036834716796875, -0.2533454895019531, -0.2463226318359375, -0.23929977416992188, -0.23227691650390625, -0.22525405883789062, -0.218231201171875, -0.21120834350585938, -0.20418548583984375, -0.19716262817382812, -0.1901397705078125, -0.18311691284179688, -0.17609405517578125, -0.16907119750976562, -0.16204833984375, -0.15502548217773438, -0.14800262451171875, -0.14097976684570312, -0.1339569091796875, -0.12693405151367188, -0.11991119384765625, -0.11288833618164062, -0.105865478515625, -0.09884262084960938, -0.09181976318359375, -0.08479690551757812, -0.0777740478515625, -0.07075119018554688, -0.06372833251953125, -0.056705474853515625, -0.0496826171875, -0.042659759521484375, -0.03563690185546875, -0.028614044189453125, -0.0215911865234375, -0.014568328857421875, -0.00754547119140625, -0.000522613525390625, 0.006500244140625, 0.013523101806640625, 0.02054595947265625, 0.027568817138671875, 0.0345916748046875, 0.041614532470703125, 0.04863739013671875, 0.055660247802734375, 0.06268310546875, 0.06970596313476562, 0.07672882080078125, 0.08375167846679688, 0.0907745361328125, 0.09779739379882812, 0.10482025146484375, 0.11184310913085938, 0.118865966796875, 0.12588882446289062, 0.13291168212890625, 0.13993453979492188, 0.1469573974609375, 0.15398025512695312, 0.16100311279296875, 0.16802597045898438, 0.175048828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 8.0, 11.0, 10.0, 14.0, 18.0, 32.0, 34.0, 38.0, 92.0, 74.0, 126.0, 149.0, 234.0, 333.0, 509.0, 996.0, 2424.0, 6659.0, 23159.0, 93412.0, 323846.0, 405042.0, 140982.0, 34531.0, 9527.0, 3110.0, 1298.0, 623.0, 361.0, 246.0, 176.0, 120.0, 89.0, 82.0, 39.0, 51.0, 30.0, 17.0, 14.0, 11.0, 13.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6611328125, -0.63677978515625, -0.6124267578125, -0.58807373046875, -0.563720703125, -0.53936767578125, -0.5150146484375, -0.49066162109375, -0.46630859375, -0.44195556640625, -0.4176025390625, -0.39324951171875, -0.368896484375, -0.34454345703125, -0.3201904296875, -0.29583740234375, -0.271484375, -0.24713134765625, -0.2227783203125, -0.19842529296875, -0.174072265625, -0.14971923828125, -0.1253662109375, -0.10101318359375, -0.07666015625, -0.05230712890625, -0.0279541015625, -0.00360107421875, 0.020751953125, 0.04510498046875, 0.0694580078125, 0.09381103515625, 0.1181640625, 0.14251708984375, 0.1668701171875, 0.19122314453125, 0.215576171875, 0.23992919921875, 0.2642822265625, 0.28863525390625, 0.31298828125, 0.33734130859375, 0.3616943359375, 0.38604736328125, 0.410400390625, 0.43475341796875, 0.4591064453125, 0.48345947265625, 0.5078125, 0.53216552734375, 0.5565185546875, 0.58087158203125, 0.605224609375, 0.62957763671875, 0.6539306640625, 0.67828369140625, 0.70263671875, 0.72698974609375, 0.7513427734375, 0.77569580078125, 0.800048828125, 0.82440185546875, 0.8487548828125, 0.87310791015625, 0.8974609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 4.0, 14.0, 9.0, 5.0, 11.0, 10.0, 25.0, 38.0, 31.0, 33.0, 30.0, 38.0, 48.0, 49.0, 42.0, 66.0, 63.0, 39.0, 40.0, 45.0, 40.0, 42.0, 32.0, 40.0, 41.0, 38.0, 24.0, 17.0, 18.0, 15.0, 17.0, 6.0, 6.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6640548706054688, -0.6371917724609375, -0.6103286743164062, -0.583465576171875, -0.5566024780273438, -0.5297393798828125, -0.5028762817382812, -0.47601318359375, -0.44915008544921875, -0.4222869873046875, -0.39542388916015625, -0.368560791015625, -0.34169769287109375, -0.3148345947265625, -0.28797149658203125, -0.2611083984375, -0.23424530029296875, -0.2073822021484375, -0.18051910400390625, -0.153656005859375, -0.12679290771484375, -0.0999298095703125, -0.07306671142578125, -0.04620361328125, -0.01934051513671875, 0.0075225830078125, 0.03438568115234375, 0.061248779296875, 0.08811187744140625, 0.1149749755859375, 0.14183807373046875, 0.168701171875, 0.19556427001953125, 0.2224273681640625, 0.24929046630859375, 0.276153564453125, 0.30301666259765625, 0.3298797607421875, 0.35674285888671875, 0.38360595703125, 0.41046905517578125, 0.4373321533203125, 0.46419525146484375, 0.491058349609375, 0.5179214477539062, 0.5447845458984375, 0.5716476440429688, 0.5985107421875, 0.6253738403320312, 0.6522369384765625, 0.6791000366210938, 0.705963134765625, 0.7328262329101562, 0.7596893310546875, 0.7865524291992188, 0.81341552734375, 0.8402786254882812, 0.8671417236328125, 0.8940048217773438, 0.920867919921875, 0.9477310180664062, 0.9745941162109375, 1.0014572143554688, 1.0283203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 15.0, 10.0, 15.0, 19.0, 29.0, 53.0, 97.0, 207.0, 374.0, 974.0, 3120.0, 16426.0, 168183.0, 723187.0, 118795.0, 12899.0, 2554.0, 844.0, 380.0, 167.0, 91.0, 55.0, 23.0, 8.0, 8.0, 3.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6679916381835938, -0.6460418701171875, -0.6240921020507812, -0.602142333984375, -0.5801925659179688, -0.5582427978515625, -0.5362930297851562, -0.51434326171875, -0.49239349365234375, -0.4704437255859375, -0.44849395751953125, -0.426544189453125, -0.40459442138671875, -0.3826446533203125, -0.36069488525390625, -0.3387451171875, -0.31679534912109375, -0.2948455810546875, -0.27289581298828125, -0.250946044921875, -0.22899627685546875, -0.2070465087890625, -0.18509674072265625, -0.16314697265625, -0.14119720458984375, -0.1192474365234375, -0.09729766845703125, -0.075347900390625, -0.05339813232421875, -0.0314483642578125, -0.00949859619140625, 0.012451171875, 0.03440093994140625, 0.0563507080078125, 0.07830047607421875, 0.100250244140625, 0.12220001220703125, 0.1441497802734375, 0.16609954833984375, 0.18804931640625, 0.20999908447265625, 0.2319488525390625, 0.25389862060546875, 0.275848388671875, 0.29779815673828125, 0.3197479248046875, 0.34169769287109375, 0.3636474609375, 0.38559722900390625, 0.4075469970703125, 0.42949676513671875, 0.451446533203125, 0.47339630126953125, 0.4953460693359375, 0.5172958374023438, 0.53924560546875, 0.5611953735351562, 0.5831451416015625, 0.6050949096679688, 0.627044677734375, 0.6489944458007812, 0.6709442138671875, 0.6928939819335938, 0.71484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 6.0, 10.0, 16.0, 16.0, 22.0, 37.0, 45.0, 44.0, 72.0, 90.0, 99.0, 104.0, 90.0, 62.0, 55.0, 59.0, 27.0, 24.0, 23.0, 17.0, 15.0, 13.0, 9.0, 5.0, 3.0, 5.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00010752677917480469, -0.00010478124022483826, -0.00010203570127487183, -9.92901623249054e-05, -9.654462337493896e-05, -9.379908442497253e-05, -9.10535454750061e-05, -8.830800652503967e-05, -8.556246757507324e-05, -8.281692862510681e-05, -8.007138967514038e-05, -7.732585072517395e-05, -7.458031177520752e-05, -7.183477282524109e-05, -6.908923387527466e-05, -6.634369492530823e-05, -6.35981559753418e-05, -6.0852617025375366e-05, -5.8107078075408936e-05, -5.5361539125442505e-05, -5.2616000175476074e-05, -4.9870461225509644e-05, -4.712492227554321e-05, -4.437938332557678e-05, -4.163384437561035e-05, -3.888830542564392e-05, -3.614276647567749e-05, -3.339722752571106e-05, -3.065168857574463e-05, -2.7906149625778198e-05, -2.5160610675811768e-05, -2.2415071725845337e-05, -1.9669532775878906e-05, -1.6923993825912476e-05, -1.4178454875946045e-05, -1.1432915925979614e-05, -8.687376976013184e-06, -5.941838026046753e-06, -3.1962990760803223e-06, -4.507601261138916e-07, 2.294778823852539e-06, 5.04031777381897e-06, 7.7858567237854e-06, 1.0531395673751831e-05, 1.3276934623718262e-05, 1.6022473573684692e-05, 1.8768012523651123e-05, 2.1513551473617554e-05, 2.4259090423583984e-05, 2.7004629373550415e-05, 2.9750168323516846e-05, 3.2495707273483276e-05, 3.524124622344971e-05, 3.798678517341614e-05, 4.073232412338257e-05, 4.3477863073349e-05, 4.622340202331543e-05, 4.896894097328186e-05, 5.171447992324829e-05, 5.446001887321472e-05, 5.720555782318115e-05, 5.995109677314758e-05, 6.269663572311401e-05, 6.544217467308044e-05, 6.818771362304688e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 11.0, 12.0, 35.0, 52.0, 123.0, 180.0, 530.0, 1973.0, 15414.0, 380342.0, 618642.0, 27328.0, 2744.0, 650.0, 268.0, 123.0, 59.0, 27.0, 16.0, 12.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.2338790893554688, -1.2031097412109375, -1.1723403930664062, -1.141571044921875, -1.1108016967773438, -1.0800323486328125, -1.0492630004882812, -1.01849365234375, -0.9877243041992188, -0.9569549560546875, -0.9261856079101562, -0.895416259765625, -0.8646469116210938, -0.8338775634765625, -0.8031082153320312, -0.7723388671875, -0.7415695190429688, -0.7108001708984375, -0.6800308227539062, -0.649261474609375, -0.6184921264648438, -0.5877227783203125, -0.5569534301757812, -0.52618408203125, -0.49541473388671875, -0.4646453857421875, -0.43387603759765625, -0.403106689453125, -0.37233734130859375, -0.3415679931640625, -0.31079864501953125, -0.280029296875, -0.24925994873046875, -0.2184906005859375, -0.18772125244140625, -0.156951904296875, -0.12618255615234375, -0.0954132080078125, -0.06464385986328125, -0.03387451171875, -0.00310516357421875, 0.0276641845703125, 0.05843353271484375, 0.089202880859375, 0.11997222900390625, 0.1507415771484375, 0.18151092529296875, 0.2122802734375, 0.24304962158203125, 0.2738189697265625, 0.30458831787109375, 0.335357666015625, 0.36612701416015625, 0.3968963623046875, 0.42766571044921875, 0.45843505859375, 0.48920440673828125, 0.5199737548828125, 0.5507431030273438, 0.581512451171875, 0.6122817993164062, 0.6430511474609375, 0.6738204956054688, 0.70458984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 3.0, 14.0, 13.0, 27.0, 32.0, 40.0, 49.0, 68.0, 89.0, 93.0, 117.0, 102.0, 80.0, 69.0, 53.0, 44.0, 35.0, 19.0, 12.0, 10.0, 5.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5556640625, -0.53912353515625, -0.5225830078125, -0.50604248046875, -0.489501953125, -0.47296142578125, -0.4564208984375, -0.43988037109375, -0.42333984375, -0.40679931640625, -0.3902587890625, -0.37371826171875, -0.357177734375, -0.34063720703125, -0.3240966796875, -0.30755615234375, -0.291015625, -0.27447509765625, -0.2579345703125, -0.24139404296875, -0.224853515625, -0.20831298828125, -0.1917724609375, -0.17523193359375, -0.15869140625, -0.14215087890625, -0.1256103515625, -0.10906982421875, -0.092529296875, -0.07598876953125, -0.0594482421875, -0.04290771484375, -0.0263671875, -0.00982666015625, 0.0067138671875, 0.02325439453125, 0.039794921875, 0.05633544921875, 0.0728759765625, 0.08941650390625, 0.10595703125, 0.12249755859375, 0.1390380859375, 0.15557861328125, 0.172119140625, 0.18865966796875, 0.2052001953125, 0.22174072265625, 0.23828125, 0.25482177734375, 0.2713623046875, 0.28790283203125, 0.304443359375, 0.32098388671875, 0.3375244140625, 0.35406494140625, 0.37060546875, 0.38714599609375, 0.4036865234375, 0.42022705078125, 0.436767578125, 0.45330810546875, 0.4698486328125, 0.48638916015625, 0.5029296875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 13.0, 28.0, 69.0, 89.0, 131.0, 165.0, 172.0, 145.0, 91.0, 46.0, 36.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.52730941772461, -13.234052658081055, -12.940794944763184, -12.647537231445312, -12.354280471801758, -12.061023712158203, -11.767765998840332, -11.474508285522461, -11.181251525878906, -10.887994766235352, -10.59473705291748, -10.30147933959961, -10.008222579956055, -9.7149658203125, -9.421708106994629, -9.128450393676758, -8.835193634033203, -8.541936874389648, -8.248679161071777, -7.9554219245910645, -7.662164688110352, -7.368907451629639, -7.075650215148926, -6.782392978668213, -6.4891357421875, -6.195878505706787, -5.902621269226074, -5.609364032745361, -5.316106796264648, -5.0228495597839355, -4.729592323303223, -4.43633508682251, -4.1430768966674805, -3.8498196601867676, -3.5565624237060547, -3.263305187225342, -2.970047950744629, -2.676790714263916, -2.383533477783203, -2.0902762413024902, -1.7970190048217773, -1.5037617683410645, -1.2105045318603516, -0.9172472953796387, -0.6239900588989258, -0.3307328224182129, -0.0374755859375, 0.2557816505432129, 0.5490388870239258, 0.8422961235046387, 1.1355533599853516, 1.4288105964660645, 1.7220678329467773, 2.0153250694274902, 2.308582305908203, 2.601839542388916, 2.895096778869629, 3.188354015350342, 3.4816112518310547, 3.7748684883117676, 4.0681257247924805, 4.361382961273193, 4.654640197753906, 4.947897434234619, 5.241154670715332]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 9.0, 8.0, 14.0, 17.0, 25.0, 24.0, 41.0, 25.0, 31.0, 30.0, 54.0, 39.0, 34.0, 38.0, 42.0, 42.0, 50.0, 51.0, 36.0, 41.0, 36.0, 45.0, 38.0, 27.0, 35.0, 22.0, 22.0, 19.0, 20.0, 12.0, 18.0, 13.0, 10.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6102945804595947, -3.4762771129608154, -3.3422598838806152, -3.208242416381836, -3.0742249488830566, -2.9402074813842773, -2.806190013885498, -2.672172784805298, -2.5381553173065186, -2.4041378498077393, -2.270120620727539, -2.1361031532287598, -2.0020856857299805, -1.8680682182312012, -1.7340508699417114, -1.6000335216522217, -1.4660160541534424, -1.331998586654663, -1.1979812383651733, -1.0639638900756836, -0.9299464225769043, -0.7959290146827698, -0.6619116067886353, -0.5278941988945007, -0.3938767910003662, -0.2598593831062317, -0.12584197521209717, 0.008175432682037354, 0.14219284057617188, 0.2762102484703064, 0.4102276563644409, 0.5442450642585754, 0.6782627105712891, 0.8122801184654236, 0.9462975263595581, 1.0803148746490479, 1.2143323421478271, 1.3483498096466064, 1.4823671579360962, 1.616384506225586, 1.7504019737243652, 1.8844194412231445, 2.018436908721924, 2.152454137802124, 2.2864716053009033, 2.4204890727996826, 2.554506301879883, 2.688523769378662, 2.8225412368774414, 2.9565587043762207, 3.090576171875, 3.2245934009552, 3.3586108684539795, 3.492628335952759, 3.626645565032959, 3.7606630325317383, 3.8946805000305176, 4.028697967529297, 4.162715435028076, 4.2967329025268555, 4.430749893188477, 4.564767360687256, 4.698784828186035, 4.8328022956848145, 4.966819763183594]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 3.0, 8.0, 13.0, 9.0, 15.0, 29.0, 27.0, 59.0, 99.0, 127.0, 305.0, 772.0, 3422.0, 33518.0, 4007929.0, 137681.0, 7688.0, 1531.0, 540.0, 234.0, 115.0, 62.0, 36.0, 23.0, 11.0, 12.0, 4.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.908203125, -1.806182861328125, -1.70416259765625, -1.602142333984375, -1.5001220703125, -1.398101806640625, -1.29608154296875, -1.194061279296875, -1.092041015625, -0.990020751953125, -0.88800048828125, -0.785980224609375, -0.6839599609375, -0.581939697265625, -0.47991943359375, -0.377899169921875, -0.27587890625, -0.173858642578125, -0.07183837890625, 0.030181884765625, 0.1322021484375, 0.234222412109375, 0.33624267578125, 0.438262939453125, 0.540283203125, 0.642303466796875, 0.74432373046875, 0.846343994140625, 0.9483642578125, 1.050384521484375, 1.15240478515625, 1.254425048828125, 1.3564453125, 1.458465576171875, 1.56048583984375, 1.662506103515625, 1.7645263671875, 1.866546630859375, 1.96856689453125, 2.070587158203125, 2.172607421875, 2.274627685546875, 2.37664794921875, 2.478668212890625, 2.5806884765625, 2.682708740234375, 2.78472900390625, 2.886749267578125, 2.98876953125, 3.090789794921875, 3.19281005859375, 3.294830322265625, 3.3968505859375, 3.498870849609375, 3.60089111328125, 3.702911376953125, 3.804931640625, 3.906951904296875, 4.00897216796875, 4.110992431640625, 4.2130126953125, 4.315032958984375, 4.41705322265625, 4.519073486328125, 4.62109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 13.0, 15.0, 13.0, 21.0, 30.0, 46.0, 41.0, 42.0, 43.0, 50.0, 67.0, 53.0, 62.0, 73.0, 53.0, 61.0, 55.0, 36.0, 37.0, 41.0, 31.0, 26.0, 22.0, 14.0, 14.0, 11.0, 3.0, 8.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.284912109375, -0.2776031494140625, -0.270294189453125, -0.2629852294921875, -0.25567626953125, -0.2483673095703125, -0.241058349609375, -0.2337493896484375, -0.2264404296875, -0.2191314697265625, -0.211822509765625, -0.2045135498046875, -0.19720458984375, -0.1898956298828125, -0.182586669921875, -0.1752777099609375, -0.16796875, -0.1606597900390625, -0.153350830078125, -0.1460418701171875, -0.13873291015625, -0.1314239501953125, -0.124114990234375, -0.1168060302734375, -0.1094970703125, -0.1021881103515625, -0.094879150390625, -0.0875701904296875, -0.08026123046875, -0.0729522705078125, -0.065643310546875, -0.0583343505859375, -0.051025390625, -0.0437164306640625, -0.036407470703125, -0.0290985107421875, -0.02178955078125, -0.0144805908203125, -0.007171630859375, 0.0001373291015625, 0.0074462890625, 0.0147552490234375, 0.022064208984375, 0.0293731689453125, 0.03668212890625, 0.0439910888671875, 0.051300048828125, 0.0586090087890625, 0.06591796875, 0.0732269287109375, 0.080535888671875, 0.0878448486328125, 0.09515380859375, 0.1024627685546875, 0.109771728515625, 0.1170806884765625, 0.1243896484375, 0.1316986083984375, 0.139007568359375, 0.1463165283203125, 0.15362548828125, 0.1609344482421875, 0.168243408203125, 0.1755523681640625, 0.182861328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 9.0, 18.0, 29.0, 52.0, 94.0, 151.0, 282.0, 485.0, 792.0, 1529.0, 3131.0, 7602.0, 26910.0, 174221.0, 3700974.0, 230766.0, 31712.0, 8424.0, 3334.0, 1727.0, 873.0, 513.0, 268.0, 163.0, 97.0, 50.0, 34.0, 16.0, 9.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.2368621826171875, -1.196380615234375, -1.1558990478515625, -1.11541748046875, -1.0749359130859375, -1.034454345703125, -0.9939727783203125, -0.9534912109375, -0.9130096435546875, -0.872528076171875, -0.8320465087890625, -0.79156494140625, -0.7510833740234375, -0.710601806640625, -0.6701202392578125, -0.629638671875, -0.5891571044921875, -0.548675537109375, -0.5081939697265625, -0.46771240234375, -0.4272308349609375, -0.386749267578125, -0.3462677001953125, -0.3057861328125, -0.2653045654296875, -0.224822998046875, -0.1843414306640625, -0.14385986328125, -0.1033782958984375, -0.062896728515625, -0.0224151611328125, 0.01806640625, 0.0585479736328125, 0.099029541015625, 0.1395111083984375, 0.17999267578125, 0.2204742431640625, 0.260955810546875, 0.3014373779296875, 0.3419189453125, 0.3824005126953125, 0.422882080078125, 0.4633636474609375, 0.50384521484375, 0.5443267822265625, 0.584808349609375, 0.6252899169921875, 0.665771484375, 0.7062530517578125, 0.746734619140625, 0.7872161865234375, 0.82769775390625, 0.8681793212890625, 0.908660888671875, 0.9491424560546875, 0.9896240234375, 1.0301055908203125, 1.070587158203125, 1.1110687255859375, 1.15155029296875, 1.1920318603515625, 1.232513427734375, 1.2729949951171875, 1.3134765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 19.0, 29.0, 37.0, 96.0, 167.0, 463.0, 2191.0, 587.0, 194.0, 82.0, 57.0, 28.0, 29.0, 12.0, 16.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6463394165039062, -0.6251983642578125, -0.6040573120117188, -0.582916259765625, -0.5617752075195312, -0.5406341552734375, -0.5194931030273438, -0.49835205078125, -0.47721099853515625, -0.4560699462890625, -0.43492889404296875, -0.413787841796875, -0.39264678955078125, -0.3715057373046875, -0.35036468505859375, -0.3292236328125, -0.30808258056640625, -0.2869415283203125, -0.26580047607421875, -0.244659423828125, -0.22351837158203125, -0.2023773193359375, -0.18123626708984375, -0.16009521484375, -0.13895416259765625, -0.1178131103515625, -0.09667205810546875, -0.075531005859375, -0.05438995361328125, -0.0332489013671875, -0.01210784912109375, 0.009033203125, 0.03017425537109375, 0.0513153076171875, 0.07245635986328125, 0.093597412109375, 0.11473846435546875, 0.1358795166015625, 0.15702056884765625, 0.17816162109375, 0.19930267333984375, 0.2204437255859375, 0.24158477783203125, 0.262725830078125, 0.28386688232421875, 0.3050079345703125, 0.32614898681640625, 0.3472900390625, 0.36843109130859375, 0.3895721435546875, 0.41071319580078125, 0.431854248046875, 0.45299530029296875, 0.4741363525390625, 0.49527740478515625, 0.51641845703125, 0.5375595092773438, 0.5587005615234375, 0.5798416137695312, 0.600982666015625, 0.6221237182617188, 0.6432647705078125, 0.6644058227539062, 0.685546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 6.0, 20.0, 42.0, 119.0, 241.0, 247.0, 174.0, 80.0, 32.0, 18.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0390124320983887, -2.8628294467926025, -2.6866466999053955, -2.5104637145996094, -2.3342809677124023, -2.158097982406616, -1.98191499710083, -1.8057321310043335, -1.629549264907837, -1.4533663988113403, -1.2771835327148438, -1.1010005474090576, -0.924817681312561, -0.7486348152160645, -0.5724518299102783, -0.39626896381378174, -0.22008609771728516, -0.043903201818466187, 0.13227969408035278, 0.30846261978149414, 0.4846454858779907, 0.6608283519744873, 0.8370113372802734, 1.01319420337677, 1.1893770694732666, 1.3655599355697632, 1.5417428016662598, 1.717925786972046, 1.8941086530685425, 2.070291519165039, 2.246474504470825, 2.4226574897766113, 2.59883975982666, 2.7750227451324463, 2.9512054920196533, 3.1273884773254395, 3.3035712242126465, 3.4797542095184326, 3.6559371948242188, 3.832119941711426, 4.008302688598633, 4.18448543548584, 4.360668659210205, 4.536851406097412, 4.713034152984619, 4.889217376708984, 5.065400123596191, 5.241582870483398, 5.417766094207764, 5.593948841094971, 5.770132064819336, 5.946314811706543, 6.12249755859375, 6.298680305480957, 6.474863529205322, 6.651046276092529, 6.8272294998168945, 7.003412246704102, 7.179595470428467, 7.355778217315674, 7.531960964202881, 7.708144187927246, 7.884326934814453, 8.06050968170166, 8.236692428588867]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 10.0, 11.0, 6.0, 10.0, 15.0, 20.0, 27.0, 32.0, 37.0, 31.0, 37.0, 41.0, 45.0, 53.0, 57.0, 61.0, 56.0, 36.0, 50.0, 49.0, 62.0, 38.0, 46.0, 25.0, 20.0, 17.0, 24.0, 14.0, 9.0, 10.0, 11.0, 8.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.198601007461548, -2.1419484615325928, -2.0852956771850586, -2.0286431312561035, -1.9719904661178589, -1.9153378009796143, -1.8586851358413696, -1.802032470703125, -1.74537992477417, -1.6887272596359253, -1.6320745944976807, -1.5754220485687256, -1.518769383430481, -1.4621167182922363, -1.4054640531539917, -1.348811388015747, -1.2921587228775024, -1.2355060577392578, -1.1788533926010132, -1.1222007274627686, -1.0655481815338135, -1.0088955163955688, -0.9522428512573242, -0.8955901861190796, -0.8389375805854797, -0.7822849154472351, -0.7256323099136353, -0.6689796447753906, -0.612326979637146, -0.5556743741035461, -0.4990217089653015, -0.4423690736293793, -0.38571643829345703, -0.3290638029575348, -0.27241116762161255, -0.21575850248336792, -0.15910586714744568, -0.10245323181152344, -0.04580056667327881, 0.010852068662643433, 0.06750470399856567, 0.12415734678506851, 0.18080998957157135, 0.23746263980865479, 0.294115275144577, 0.35076791048049927, 0.4074205756187439, 0.46407321095466614, 0.5207258462905884, 0.577378511428833, 0.6340311169624329, 0.6906837821006775, 0.7473363876342773, 0.803989052772522, 0.8606417179107666, 0.9172943830490112, 0.9739469885826111, 1.030599594116211, 1.0872522592544556, 1.1439049243927002, 1.2005575895309448, 1.2572102546691895, 1.3138628005981445, 1.3705154657363892, 1.4271681308746338]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 11.0, 12.0, 44.0, 41.0, 73.0, 149.0, 284.0, 931.0, 4438.0, 60018.0, 784877.0, 185853.0, 9443.0, 1491.0, 446.0, 176.0, 96.0, 49.0, 37.0, 21.0, 16.0, 11.0, 8.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.604034423828125, -1.52642822265625, -1.448822021484375, -1.3712158203125, -1.293609619140625, -1.21600341796875, -1.138397216796875, -1.060791015625, -0.983184814453125, -0.90557861328125, -0.827972412109375, -0.7503662109375, -0.672760009765625, -0.59515380859375, -0.517547607421875, -0.43994140625, -0.362335205078125, -0.28472900390625, -0.207122802734375, -0.1295166015625, -0.051910400390625, 0.02569580078125, 0.103302001953125, 0.180908203125, 0.258514404296875, 0.33612060546875, 0.413726806640625, 0.4913330078125, 0.568939208984375, 0.64654541015625, 0.724151611328125, 0.8017578125, 0.879364013671875, 0.95697021484375, 1.034576416015625, 1.1121826171875, 1.189788818359375, 1.26739501953125, 1.345001220703125, 1.422607421875, 1.500213623046875, 1.57781982421875, 1.655426025390625, 1.7330322265625, 1.810638427734375, 1.88824462890625, 1.965850830078125, 2.04345703125, 2.121063232421875, 2.19866943359375, 2.276275634765625, 2.3538818359375, 2.431488037109375, 2.50909423828125, 2.586700439453125, 2.664306640625, 2.741912841796875, 2.81951904296875, 2.897125244140625, 2.9747314453125, 3.052337646484375, 3.12994384765625, 3.207550048828125, 3.28515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 6.0, 9.0, 19.0, 15.0, 26.0, 24.0, 27.0, 53.0, 49.0, 44.0, 50.0, 57.0, 58.0, 66.0, 55.0, 50.0, 48.0, 40.0, 47.0, 45.0, 41.0, 43.0, 23.0, 20.0, 14.0, 13.0, 11.0, 10.0, 10.0, 8.0, 1.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.324462890625, -0.3163471221923828, -0.3082313537597656, -0.30011558532714844, -0.29199981689453125, -0.28388404846191406, -0.2757682800292969, -0.2676525115966797, -0.2595367431640625, -0.2514209747314453, -0.24330520629882812, -0.23518943786621094, -0.22707366943359375, -0.21895790100097656, -0.21084213256835938, -0.2027263641357422, -0.194610595703125, -0.1864948272705078, -0.17837905883789062, -0.17026329040527344, -0.16214752197265625, -0.15403175354003906, -0.14591598510742188, -0.1378002166748047, -0.1296844482421875, -0.12156867980957031, -0.11345291137695312, -0.10533714294433594, -0.09722137451171875, -0.08910560607910156, -0.08098983764648438, -0.07287406921386719, -0.06475830078125, -0.05664253234863281, -0.048526763916015625, -0.04041099548339844, -0.03229522705078125, -0.024179458618164062, -0.016063690185546875, -0.007947921752929688, 0.0001678466796875, 0.008283615112304688, 0.016399383544921875, 0.024515151977539062, 0.03263092041015625, 0.04074668884277344, 0.048862457275390625, 0.05697822570800781, 0.065093994140625, 0.07320976257324219, 0.08132553100585938, 0.08944129943847656, 0.09755706787109375, 0.10567283630371094, 0.11378860473632812, 0.12190437316894531, 0.1300201416015625, 0.1381359100341797, 0.14625167846679688, 0.15436744689941406, 0.16248321533203125, 0.17059898376464844, 0.17871475219726562, 0.1868305206298828, 0.1949462890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 12.0, 5.0, 5.0, 13.0, 13.0, 19.0, 28.0, 45.0, 51.0, 93.0, 137.0, 167.0, 279.0, 431.0, 740.0, 1432.0, 3328.0, 8900.0, 31183.0, 127677.0, 440195.0, 323096.0, 78818.0, 20176.0, 6400.0, 2446.0, 1151.0, 587.0, 387.0, 214.0, 137.0, 107.0, 91.0, 55.0, 46.0, 26.0, 13.0, 13.0, 11.0, 6.0, 3.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.9423828125, -0.9136810302734375, -0.884979248046875, -0.8562774658203125, -0.82757568359375, -0.7988739013671875, -0.770172119140625, -0.7414703369140625, -0.7127685546875, -0.6840667724609375, -0.655364990234375, -0.6266632080078125, -0.59796142578125, -0.5692596435546875, -0.540557861328125, -0.5118560791015625, -0.483154296875, -0.4544525146484375, -0.425750732421875, -0.3970489501953125, -0.36834716796875, -0.3396453857421875, -0.310943603515625, -0.2822418212890625, -0.2535400390625, -0.2248382568359375, -0.196136474609375, -0.1674346923828125, -0.13873291015625, -0.1100311279296875, -0.081329345703125, -0.0526275634765625, -0.02392578125, 0.0047760009765625, 0.033477783203125, 0.0621795654296875, 0.09088134765625, 0.1195831298828125, 0.148284912109375, 0.1769866943359375, 0.2056884765625, 0.2343902587890625, 0.263092041015625, 0.2917938232421875, 0.32049560546875, 0.3491973876953125, 0.377899169921875, 0.4066009521484375, 0.435302734375, 0.4640045166015625, 0.492706298828125, 0.5214080810546875, 0.55010986328125, 0.5788116455078125, 0.607513427734375, 0.6362152099609375, 0.6649169921875, 0.6936187744140625, 0.722320556640625, 0.7510223388671875, 0.77972412109375, 0.8084259033203125, 0.837127685546875, 0.8658294677734375, 0.89453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 4.0, 6.0, 13.0, 24.0, 21.0, 22.0, 32.0, 29.0, 43.0, 44.0, 62.0, 56.0, 64.0, 60.0, 51.0, 58.0, 40.0, 64.0, 41.0, 38.0, 25.0, 35.0, 28.0, 28.0, 21.0, 15.0, 11.0, 18.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0169525146484375, -0.977264404296875, -0.9375762939453125, -0.89788818359375, -0.8582000732421875, -0.818511962890625, -0.7788238525390625, -0.7391357421875, -0.6994476318359375, -0.659759521484375, -0.6200714111328125, -0.58038330078125, -0.5406951904296875, -0.501007080078125, -0.4613189697265625, -0.421630859375, -0.3819427490234375, -0.342254638671875, -0.3025665283203125, -0.26287841796875, -0.2231903076171875, -0.183502197265625, -0.1438140869140625, -0.1041259765625, -0.0644378662109375, -0.024749755859375, 0.0149383544921875, 0.05462646484375, 0.0943145751953125, 0.134002685546875, 0.1736907958984375, 0.21337890625, 0.2530670166015625, 0.292755126953125, 0.3324432373046875, 0.37213134765625, 0.4118194580078125, 0.451507568359375, 0.4911956787109375, 0.5308837890625, 0.5705718994140625, 0.610260009765625, 0.6499481201171875, 0.68963623046875, 0.7293243408203125, 0.769012451171875, 0.8087005615234375, 0.848388671875, 0.8880767822265625, 0.927764892578125, 0.9674530029296875, 1.00714111328125, 1.0468292236328125, 1.086517333984375, 1.1262054443359375, 1.1658935546875, 1.2055816650390625, 1.245269775390625, 1.2849578857421875, 1.32464599609375, 1.3643341064453125, 1.404022216796875, 1.4437103271484375, 1.4833984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 16.0, 11.0, 31.0, 26.0, 50.0, 66.0, 105.0, 183.0, 339.0, 707.0, 1606.0, 4135.0, 15294.0, 98310.0, 635416.0, 251044.0, 30160.0, 6753.0, 2284.0, 914.0, 475.0, 238.0, 120.0, 83.0, 46.0, 31.0, 19.0, 14.0, 18.0, 8.0, 8.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.6474609375, -0.6256637573242188, -0.6038665771484375, -0.5820693969726562, -0.560272216796875, -0.5384750366210938, -0.5166778564453125, -0.49488067626953125, -0.47308349609375, -0.45128631591796875, -0.4294891357421875, -0.40769195556640625, -0.385894775390625, -0.36409759521484375, -0.3423004150390625, -0.32050323486328125, -0.2987060546875, -0.27690887451171875, -0.2551116943359375, -0.23331451416015625, -0.211517333984375, -0.18972015380859375, -0.1679229736328125, -0.14612579345703125, -0.12432861328125, -0.10253143310546875, -0.0807342529296875, -0.05893707275390625, -0.037139892578125, -0.01534271240234375, 0.0064544677734375, 0.02825164794921875, 0.050048828125, 0.07184600830078125, 0.0936431884765625, 0.11544036865234375, 0.137237548828125, 0.15903472900390625, 0.1808319091796875, 0.20262908935546875, 0.22442626953125, 0.24622344970703125, 0.2680206298828125, 0.28981781005859375, 0.311614990234375, 0.33341217041015625, 0.3552093505859375, 0.37700653076171875, 0.3988037109375, 0.42060089111328125, 0.4423980712890625, 0.46419525146484375, 0.485992431640625, 0.5077896118164062, 0.5295867919921875, 0.5513839721679688, 0.57318115234375, 0.5949783325195312, 0.6167755126953125, 0.6385726928710938, 0.660369873046875, 0.6821670532226562, 0.7039642333984375, 0.7257614135742188, 0.74755859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 10.0, 7.0, 10.0, 22.0, 29.0, 28.0, 37.0, 35.0, 43.0, 73.0, 62.0, 86.0, 103.0, 74.0, 73.0, 60.0, 55.0, 47.0, 33.0, 26.0, 23.0, 12.0, 5.0, 12.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.279085159301758e-05, -8.021295070648193e-05, -7.763504981994629e-05, -7.505714893341064e-05, -7.2479248046875e-05, -6.990134716033936e-05, -6.732344627380371e-05, -6.474554538726807e-05, -6.216764450073242e-05, -5.958974361419678e-05, -5.701184272766113e-05, -5.443394184112549e-05, -5.1856040954589844e-05, -4.92781400680542e-05, -4.6700239181518555e-05, -4.412233829498291e-05, -4.1544437408447266e-05, -3.896653652191162e-05, -3.6388635635375977e-05, -3.381073474884033e-05, -3.123283386230469e-05, -2.8654932975769043e-05, -2.60770320892334e-05, -2.3499131202697754e-05, -2.092123031616211e-05, -1.8343329429626465e-05, -1.576542854309082e-05, -1.3187527656555176e-05, -1.0609626770019531e-05, -8.031725883483887e-06, -5.453824996948242e-06, -2.8759241104125977e-06, -2.980232238769531e-07, 2.2798776626586914e-06, 4.857778549194336e-06, 7.4356794357299805e-06, 1.0013580322265625e-05, 1.259148120880127e-05, 1.5169382095336914e-05, 1.774728298187256e-05, 2.0325183868408203e-05, 2.2903084754943848e-05, 2.5480985641479492e-05, 2.8058886528015137e-05, 3.063678741455078e-05, 3.3214688301086426e-05, 3.579258918762207e-05, 3.8370490074157715e-05, 4.094839096069336e-05, 4.3526291847229004e-05, 4.610419273376465e-05, 4.868209362030029e-05, 5.125999450683594e-05, 5.383789539337158e-05, 5.6415796279907227e-05, 5.899369716644287e-05, 6.157159805297852e-05, 6.414949893951416e-05, 6.67273998260498e-05, 6.930530071258545e-05, 7.18832015991211e-05, 7.446110248565674e-05, 7.703900337219238e-05, 7.961690425872803e-05, 8.219480514526367e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 14.0, 20.0, 34.0, 44.0, 109.0, 185.0, 461.0, 1311.0, 5401.0, 40717.0, 587404.0, 382345.0, 24939.0, 3840.0, 978.0, 385.0, 163.0, 77.0, 42.0, 33.0, 23.0, 8.0, 12.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.89013671875, -0.8622283935546875, -0.834320068359375, -0.8064117431640625, -0.77850341796875, -0.7505950927734375, -0.722686767578125, -0.6947784423828125, -0.6668701171875, -0.6389617919921875, -0.611053466796875, -0.5831451416015625, -0.55523681640625, -0.5273284912109375, -0.499420166015625, -0.4715118408203125, -0.443603515625, -0.4156951904296875, -0.387786865234375, -0.3598785400390625, -0.33197021484375, -0.3040618896484375, -0.276153564453125, -0.2482452392578125, -0.2203369140625, -0.1924285888671875, -0.164520263671875, -0.1366119384765625, -0.10870361328125, -0.0807952880859375, -0.052886962890625, -0.0249786376953125, 0.0029296875, 0.0308380126953125, 0.058746337890625, 0.0866546630859375, 0.11456298828125, 0.1424713134765625, 0.170379638671875, 0.1982879638671875, 0.2261962890625, 0.2541046142578125, 0.282012939453125, 0.3099212646484375, 0.33782958984375, 0.3657379150390625, 0.393646240234375, 0.4215545654296875, 0.449462890625, 0.4773712158203125, 0.505279541015625, 0.5331878662109375, 0.56109619140625, 0.5890045166015625, 0.616912841796875, 0.6448211669921875, 0.6727294921875, 0.7006378173828125, 0.728546142578125, 0.7564544677734375, 0.78436279296875, 0.8122711181640625, 0.840179443359375, 0.8680877685546875, 0.89599609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 6.0, 9.0, 19.0, 18.0, 27.0, 27.0, 36.0, 41.0, 52.0, 62.0, 78.0, 96.0, 87.0, 70.0, 67.0, 55.0, 42.0, 43.0, 28.0, 26.0, 12.0, 18.0, 16.0, 11.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.51904296875, -0.5043144226074219, -0.48958587646484375, -0.4748573303222656, -0.4601287841796875, -0.4454002380371094, -0.43067169189453125, -0.4159431457519531, -0.401214599609375, -0.3864860534667969, -0.37175750732421875, -0.3570289611816406, -0.3423004150390625, -0.3275718688964844, -0.31284332275390625, -0.2981147766113281, -0.28338623046875, -0.2686576843261719, -0.25392913818359375, -0.23920059204101562, -0.2244720458984375, -0.20974349975585938, -0.19501495361328125, -0.18028640747070312, -0.165557861328125, -0.15082931518554688, -0.13610076904296875, -0.12137222290039062, -0.1066436767578125, -0.09191513061523438, -0.07718658447265625, -0.062458038330078125, -0.0477294921875, -0.033000946044921875, -0.01827239990234375, -0.003543853759765625, 0.0111846923828125, 0.025913238525390625, 0.04064178466796875, 0.055370330810546875, 0.070098876953125, 0.08482742309570312, 0.09955596923828125, 0.11428451538085938, 0.1290130615234375, 0.14374160766601562, 0.15847015380859375, 0.17319869995117188, 0.18792724609375, 0.20265579223632812, 0.21738433837890625, 0.23211288452148438, 0.2468414306640625, 0.2615699768066406, 0.27629852294921875, 0.2910270690917969, 0.305755615234375, 0.3204841613769531, 0.33521270751953125, 0.3499412536621094, 0.3646697998046875, 0.3793983459472656, 0.39412689208984375, 0.4088554382324219, 0.423583984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 19.0, 58.0, 179.0, 285.0, 288.0, 120.0, 37.0, 15.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.48061752319336, -26.85401725769043, -26.227418899536133, -25.600818634033203, -24.974220275878906, -24.347620010375977, -23.72102165222168, -23.09442138671875, -22.467823028564453, -21.841222763061523, -21.214624404907227, -20.588024139404297, -19.96142578125, -19.33482551574707, -18.708227157592773, -18.081626892089844, -17.455026626586914, -16.828426361083984, -16.201828002929688, -15.575228691101074, -14.948629379272461, -14.322029113769531, -13.695429801940918, -13.068830490112305, -12.442231178283691, -11.815631866455078, -11.189032554626465, -10.562433242797852, -9.935832977294922, -9.309234619140625, -8.682634353637695, -8.056035041809082, -7.429435729980469, -6.8028364181518555, -6.176237106323242, -5.549637317657471, -4.923038005828857, -4.296438694000244, -3.6698391437530518, -3.0432395935058594, -2.416640281677246, -1.7900408506393433, -1.1634414196014404, -0.5368419885635376, 0.08975744247436523, 0.7163567543029785, 1.342956304550171, 1.9695558547973633, 2.5961551666259766, 3.22275447845459, 3.8493540287017822, 4.475953578948975, 5.102552890777588, 5.729152202606201, 6.355751991271973, 6.982351303100586, 7.608950614929199, 8.235549926757812, 8.862149238586426, 9.488748550415039, 10.115348815917969, 10.741947174072266, 11.368547439575195, 11.995146751403809, 12.621746063232422]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 2.0, 5.0, 12.0, 9.0, 14.0, 18.0, 23.0, 13.0, 13.0, 21.0, 34.0, 26.0, 41.0, 36.0, 38.0, 43.0, 48.0, 41.0, 47.0, 55.0, 46.0, 52.0, 43.0, 37.0, 41.0, 31.0, 31.0, 24.0, 18.0, 23.0, 18.0, 22.0, 8.0, 12.0, 12.0, 6.0, 10.0, 6.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.342444896697998, -5.167723178863525, -4.993001461029053, -4.81827974319458, -4.643557548522949, -4.468835830688477, -4.294114112854004, -4.119392395019531, -3.9446706771850586, -3.769948959350586, -3.5952272415161133, -3.4205052852630615, -3.245783567428589, -3.071061849594116, -2.8963398933410645, -2.721618175506592, -2.546896457672119, -2.3721747398376465, -2.197453022003174, -2.022731065750122, -1.8480093479156494, -1.6732876300811768, -1.4985657930374146, -1.3238439559936523, -1.1491222381591797, -0.9744004607200623, -0.7996786832809448, -0.6249569058418274, -0.45023512840270996, -0.27551335096359253, -0.1007915735244751, 0.07393026351928711, 0.24865198135375977, 0.4233737587928772, 0.5980955362319946, 0.7728173136711121, 0.9475390911102295, 1.1222608089447021, 1.2969826459884644, 1.4717044830322266, 1.6464262008666992, 1.8211479187011719, 1.995869755744934, 2.1705915927886963, 2.345313310623169, 2.5200350284576416, 2.6947569847106934, 2.869478702545166, 3.0442004203796387, 3.2189221382141113, 3.393643856048584, 3.5683658123016357, 3.7430875301361084, 3.917809247970581, 4.092531204223633, 4.2672529220581055, 4.441974639892578, 4.616696357727051, 4.791418075561523, 4.966139793395996, 5.140861511230469, 5.3155837059021, 5.490305423736572, 5.665027141571045, 5.839748859405518]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 6.0, 8.0, 2.0, 12.0, 13.0, 15.0, 15.0, 45.0, 78.0, 184.0, 549.0, 2347.0, 23426.0, 4143215.0, 21234.0, 2245.0, 535.0, 165.0, 70.0, 41.0, 27.0, 15.0, 8.0, 9.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.02734375, -3.916961669921875, -3.80657958984375, -3.696197509765625, -3.5858154296875, -3.475433349609375, -3.36505126953125, -3.254669189453125, -3.144287109375, -3.033905029296875, -2.92352294921875, -2.813140869140625, -2.7027587890625, -2.592376708984375, -2.48199462890625, -2.371612548828125, -2.26123046875, -2.150848388671875, -2.04046630859375, -1.930084228515625, -1.8197021484375, -1.709320068359375, -1.59893798828125, -1.488555908203125, -1.378173828125, -1.267791748046875, -1.15740966796875, -1.047027587890625, -0.9366455078125, -0.826263427734375, -0.71588134765625, -0.605499267578125, -0.4951171875, -0.384735107421875, -0.27435302734375, -0.163970947265625, -0.0535888671875, 0.056793212890625, 0.16717529296875, 0.277557373046875, 0.387939453125, 0.498321533203125, 0.60870361328125, 0.719085693359375, 0.8294677734375, 0.939849853515625, 1.05023193359375, 1.160614013671875, 1.27099609375, 1.381378173828125, 1.49176025390625, 1.602142333984375, 1.7125244140625, 1.822906494140625, 1.93328857421875, 2.043670654296875, 2.154052734375, 2.264434814453125, 2.37481689453125, 2.485198974609375, 2.5955810546875, 2.705963134765625, 2.81634521484375, 2.926727294921875, 3.037109375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 12.0, 7.0, 11.0, 17.0, 31.0, 23.0, 43.0, 43.0, 40.0, 44.0, 56.0, 63.0, 78.0, 47.0, 51.0, 56.0, 40.0, 58.0, 45.0, 51.0, 28.0, 29.0, 21.0, 19.0, 20.0, 23.0, 13.0, 4.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324462890625, -0.3150978088378906, -0.30573272705078125, -0.2963676452636719, -0.2870025634765625, -0.2776374816894531, -0.26827239990234375, -0.2589073181152344, -0.249542236328125, -0.24017715454101562, -0.23081207275390625, -0.22144699096679688, -0.2120819091796875, -0.20271682739257812, -0.19335174560546875, -0.18398666381835938, -0.17462158203125, -0.16525650024414062, -0.15589141845703125, -0.14652633666992188, -0.1371612548828125, -0.12779617309570312, -0.11843109130859375, -0.10906600952148438, -0.099700927734375, -0.09033584594726562, -0.08097076416015625, -0.07160568237304688, -0.0622406005859375, -0.052875518798828125, -0.04351043701171875, -0.034145355224609375, -0.0247802734375, -0.015415191650390625, -0.00605010986328125, 0.003314971923828125, 0.0126800537109375, 0.022045135498046875, 0.03141021728515625, 0.040775299072265625, 0.050140380859375, 0.059505462646484375, 0.06887054443359375, 0.07823562622070312, 0.0876007080078125, 0.09696578979492188, 0.10633087158203125, 0.11569595336914062, 0.12506103515625, 0.13442611694335938, 0.14379119873046875, 0.15315628051757812, 0.1625213623046875, 0.17188644409179688, 0.18125152587890625, 0.19061660766601562, 0.199981689453125, 0.20934677124023438, 0.21871185302734375, 0.22807693481445312, 0.2374420166015625, 0.24680709838867188, 0.25617218017578125, 0.2655372619628906, 0.27490234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 2.0, 8.0, 11.0, 14.0, 18.0, 14.0, 35.0, 38.0, 73.0, 91.0, 145.0, 245.0, 424.0, 737.0, 1322.0, 2755.0, 5640.0, 13345.0, 45302.0, 3716111.0, 355705.0, 31970.0, 10579.0, 4707.0, 2249.0, 1134.0, 634.0, 358.0, 221.0, 122.0, 64.0, 35.0, 46.0, 40.0, 15.0, 19.0, 9.0, 9.0, 7.0, 3.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8994140625, -0.8712005615234375, -0.842987060546875, -0.8147735595703125, -0.78656005859375, -0.7583465576171875, -0.730133056640625, -0.7019195556640625, -0.6737060546875, -0.6454925537109375, -0.617279052734375, -0.5890655517578125, -0.56085205078125, -0.5326385498046875, -0.504425048828125, -0.4762115478515625, -0.447998046875, -0.4197845458984375, -0.391571044921875, -0.3633575439453125, -0.33514404296875, -0.3069305419921875, -0.278717041015625, -0.2505035400390625, -0.2222900390625, -0.1940765380859375, -0.165863037109375, -0.1376495361328125, -0.10943603515625, -0.0812225341796875, -0.053009033203125, -0.0247955322265625, 0.00341796875, 0.0316314697265625, 0.059844970703125, 0.0880584716796875, 0.11627197265625, 0.1444854736328125, 0.172698974609375, 0.2009124755859375, 0.2291259765625, 0.2573394775390625, 0.285552978515625, 0.3137664794921875, 0.34197998046875, 0.3701934814453125, 0.398406982421875, 0.4266204833984375, 0.454833984375, 0.4830474853515625, 0.511260986328125, 0.5394744873046875, 0.56768798828125, 0.5959014892578125, 0.624114990234375, 0.6523284912109375, 0.6805419921875, 0.7087554931640625, 0.736968994140625, 0.7651824951171875, 0.79339599609375, 0.8216094970703125, 0.849822998046875, 0.8780364990234375, 0.90625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 11.0, 10.0, 16.0, 17.0, 56.0, 227.0, 3362.0, 223.0, 62.0, 28.0, 18.0, 12.0, 6.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.428955078125, -0.4195270538330078, -0.4100990295410156, -0.40067100524902344, -0.39124298095703125, -0.38181495666503906, -0.3723869323730469, -0.3629589080810547, -0.3535308837890625, -0.3441028594970703, -0.3346748352050781, -0.32524681091308594, -0.31581878662109375, -0.30639076232910156, -0.2969627380371094, -0.2875347137451172, -0.278106689453125, -0.2686786651611328, -0.2592506408691406, -0.24982261657714844, -0.24039459228515625, -0.23096656799316406, -0.22153854370117188, -0.2121105194091797, -0.2026824951171875, -0.1932544708251953, -0.18382644653320312, -0.17439842224121094, -0.16497039794921875, -0.15554237365722656, -0.14611434936523438, -0.1366863250732422, -0.12725830078125, -0.11783027648925781, -0.10840225219726562, -0.09897422790527344, -0.08954620361328125, -0.08011817932128906, -0.07069015502929688, -0.06126213073730469, -0.0518341064453125, -0.04240608215332031, -0.032978057861328125, -0.023550033569335938, -0.01412200927734375, -0.0046939849853515625, 0.004734039306640625, 0.014162063598632812, 0.023590087890625, 0.03301811218261719, 0.042446136474609375, 0.05187416076660156, 0.06130218505859375, 0.07073020935058594, 0.08015823364257812, 0.08958625793457031, 0.0990142822265625, 0.10844230651855469, 0.11787033081054688, 0.12729835510253906, 0.13672637939453125, 0.14615440368652344, 0.15558242797851562, 0.1650104522705078, 0.1744384765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 17.0, 77.0, 220.0, 305.0, 227.0, 113.0, 26.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7380779385566711, -0.6724780201911926, -0.6068781018257141, -0.5412781834602356, -0.4756782650947571, -0.41007834672927856, -0.34447842836380005, -0.27887850999832153, -0.21327859163284302, -0.1476786732673645, -0.08207875490188599, -0.01647883653640747, 0.049121081829071045, 0.11472100019454956, 0.18032091856002808, 0.2459208369255066, 0.3115207552909851, 0.3771206736564636, 0.44272059202194214, 0.5083205103874207, 0.5739204287528992, 0.6395203471183777, 0.7051202654838562, 0.7707201838493347, 0.8363201022148132, 0.9019200205802917, 0.9675199389457703, 1.0331199169158936, 1.098719835281372, 1.1643197536468506, 1.229919672012329, 1.2955195903778076, 1.3611195087432861, 1.4267194271087646, 1.4923193454742432, 1.5579192638397217, 1.6235191822052002, 1.6891191005706787, 1.7547190189361572, 1.8203189373016357, 1.8859188556671143, 1.9515187740325928, 2.0171186923980713, 2.08271861076355, 2.1483185291290283, 2.213918447494507, 2.2795183658599854, 2.345118284225464, 2.4107182025909424, 2.476318120956421, 2.5419180393218994, 2.607517957687378, 2.6731178760528564, 2.738717794418335, 2.8043177127838135, 2.869917631149292, 2.9355175495147705, 3.001117467880249, 3.0667173862457275, 3.132317304611206, 3.1979172229766846, 3.263517141342163, 3.3291170597076416, 3.39471697807312, 3.4603168964385986]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 1.0, 5.0, 4.0, 8.0, 8.0, 7.0, 12.0, 10.0, 22.0, 22.0, 25.0, 25.0, 32.0, 33.0, 36.0, 31.0, 39.0, 41.0, 35.0, 52.0, 50.0, 41.0, 39.0, 37.0, 40.0, 31.0, 42.0, 42.0, 29.0, 34.0, 29.0, 19.0, 20.0, 13.0, 15.0, 14.0, 12.0, 9.0, 11.0, 12.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.5773084759712219, -0.5618777275085449, -0.5464469790458679, -0.5310162305831909, -0.5155854225158691, -0.5001546740531921, -0.48472392559051514, -0.46929317712783813, -0.45386242866516113, -0.43843168020248413, -0.42300093173980713, -0.40757015347480774, -0.39213940501213074, -0.37670865654945374, -0.36127787828445435, -0.34584712982177734, -0.33041638135910034, -0.31498563289642334, -0.29955488443374634, -0.28412410616874695, -0.26869335770606995, -0.25326260924339294, -0.23783184587955475, -0.22240108251571655, -0.20697033405303955, -0.19153958559036255, -0.17610882222652435, -0.16067805886268616, -0.14524731040000916, -0.12981656193733215, -0.11438579857349396, -0.09895504266023636, -0.08352428674697876, -0.06809353083372116, -0.05266277492046356, -0.03723201900720596, -0.021801263093948364, -0.006370507180690765, 0.009060248732566833, 0.024491004645824432, 0.03992176055908203, 0.05535251647233963, 0.07078327238559723, 0.08621402829885483, 0.10164478421211243, 0.11707554012537003, 0.13250629603862762, 0.14793705940246582, 0.16336780786514282, 0.17879855632781982, 0.19422931969165802, 0.20966008305549622, 0.22509083151817322, 0.24052157998085022, 0.2559523582458496, 0.2713831067085266, 0.2868138551712036, 0.3022446036338806, 0.3176753520965576, 0.333106130361557, 0.348536878824234, 0.363967627286911, 0.3793984055519104, 0.3948291540145874, 0.4102599024772644]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 8.0, 6.0, 10.0, 10.0, 21.0, 31.0, 53.0, 68.0, 104.0, 222.0, 461.0, 1440.0, 5779.0, 37468.0, 322714.0, 567646.0, 96527.0, 12112.0, 2440.0, 731.0, 340.0, 131.0, 84.0, 41.0, 39.0, 24.0, 8.0, 15.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.84375, -1.788238525390625, -1.73272705078125, -1.677215576171875, -1.6217041015625, -1.566192626953125, -1.51068115234375, -1.455169677734375, -1.399658203125, -1.344146728515625, -1.28863525390625, -1.233123779296875, -1.1776123046875, -1.122100830078125, -1.06658935546875, -1.011077880859375, -0.95556640625, -0.900054931640625, -0.84454345703125, -0.789031982421875, -0.7335205078125, -0.678009033203125, -0.62249755859375, -0.566986083984375, -0.511474609375, -0.455963134765625, -0.40045166015625, -0.344940185546875, -0.2894287109375, -0.233917236328125, -0.17840576171875, -0.122894287109375, -0.0673828125, -0.011871337890625, 0.04364013671875, 0.099151611328125, 0.1546630859375, 0.210174560546875, 0.26568603515625, 0.321197509765625, 0.376708984375, 0.432220458984375, 0.48773193359375, 0.543243408203125, 0.5987548828125, 0.654266357421875, 0.70977783203125, 0.765289306640625, 0.82080078125, 0.876312255859375, 0.93182373046875, 0.987335205078125, 1.0428466796875, 1.098358154296875, 1.15386962890625, 1.209381103515625, 1.264892578125, 1.320404052734375, 1.37591552734375, 1.431427001953125, 1.4869384765625, 1.542449951171875, 1.59796142578125, 1.653472900390625, 1.708984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 4.0, 6.0, 12.0, 11.0, 16.0, 23.0, 25.0, 39.0, 33.0, 31.0, 33.0, 40.0, 50.0, 49.0, 48.0, 72.0, 40.0, 54.0, 44.0, 49.0, 40.0, 36.0, 38.0, 37.0, 28.0, 25.0, 23.0, 18.0, 19.0, 10.0, 16.0, 6.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.319091796875, -0.3104724884033203, -0.3018531799316406, -0.29323387145996094, -0.28461456298828125, -0.27599525451660156, -0.2673759460449219, -0.2587566375732422, -0.2501373291015625, -0.2415180206298828, -0.23289871215820312, -0.22427940368652344, -0.21566009521484375, -0.20704078674316406, -0.19842147827148438, -0.1898021697998047, -0.181182861328125, -0.1725635528564453, -0.16394424438476562, -0.15532493591308594, -0.14670562744140625, -0.13808631896972656, -0.12946701049804688, -0.12084770202636719, -0.1122283935546875, -0.10360908508300781, -0.09498977661132812, -0.08637046813964844, -0.07775115966796875, -0.06913185119628906, -0.060512542724609375, -0.05189323425292969, -0.04327392578125, -0.03465461730957031, -0.026035308837890625, -0.017416000366210938, -0.00879669189453125, -0.0001773834228515625, 0.008441925048828125, 0.017061233520507812, 0.0256805419921875, 0.03429985046386719, 0.042919158935546875, 0.05153846740722656, 0.06015777587890625, 0.06877708435058594, 0.07739639282226562, 0.08601570129394531, 0.094635009765625, 0.10325431823730469, 0.11187362670898438, 0.12049293518066406, 0.12911224365234375, 0.13773155212402344, 0.14635086059570312, 0.1549701690673828, 0.1635894775390625, 0.1722087860107422, 0.18082809448242188, 0.18944740295410156, 0.19806671142578125, 0.20668601989746094, 0.21530532836914062, 0.2239246368408203, 0.2325439453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 5.0, 6.0, 10.0, 9.0, 20.0, 32.0, 36.0, 57.0, 73.0, 130.0, 207.0, 320.0, 697.0, 1553.0, 4919.0, 21906.0, 149015.0, 631015.0, 200586.0, 28424.0, 5897.0, 1837.0, 796.0, 378.0, 213.0, 129.0, 101.0, 77.0, 35.0, 23.0, 21.0, 9.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2294921875, -1.18646240234375, -1.1434326171875, -1.10040283203125, -1.057373046875, -1.01434326171875, -0.9713134765625, -0.92828369140625, -0.88525390625, -0.84222412109375, -0.7991943359375, -0.75616455078125, -0.713134765625, -0.67010498046875, -0.6270751953125, -0.58404541015625, -0.541015625, -0.49798583984375, -0.4549560546875, -0.41192626953125, -0.368896484375, -0.32586669921875, -0.2828369140625, -0.23980712890625, -0.19677734375, -0.15374755859375, -0.1107177734375, -0.06768798828125, -0.024658203125, 0.01837158203125, 0.0614013671875, 0.10443115234375, 0.1474609375, 0.19049072265625, 0.2335205078125, 0.27655029296875, 0.319580078125, 0.36260986328125, 0.4056396484375, 0.44866943359375, 0.49169921875, 0.53472900390625, 0.5777587890625, 0.62078857421875, 0.663818359375, 0.70684814453125, 0.7498779296875, 0.79290771484375, 0.8359375, 0.87896728515625, 0.9219970703125, 0.96502685546875, 1.008056640625, 1.05108642578125, 1.0941162109375, 1.13714599609375, 1.18017578125, 1.22320556640625, 1.2662353515625, 1.30926513671875, 1.352294921875, 1.39532470703125, 1.4383544921875, 1.48138427734375, 1.5244140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 4.0, 9.0, 6.0, 10.0, 12.0, 14.0, 18.0, 18.0, 31.0, 19.0, 21.0, 27.0, 34.0, 42.0, 36.0, 34.0, 45.0, 56.0, 52.0, 43.0, 47.0, 39.0, 37.0, 29.0, 48.0, 30.0, 31.0, 25.0, 32.0, 29.0, 20.0, 16.0, 20.0, 16.0, 9.0, 6.0, 6.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.2685546875, -1.2338943481445312, -1.1992340087890625, -1.1645736694335938, -1.129913330078125, -1.0952529907226562, -1.0605926513671875, -1.0259323120117188, -0.99127197265625, -0.9566116333007812, -0.9219512939453125, -0.8872909545898438, -0.852630615234375, -0.8179702758789062, -0.7833099365234375, -0.7486495971679688, -0.7139892578125, -0.6793289184570312, -0.6446685791015625, -0.6100082397460938, -0.575347900390625, -0.5406875610351562, -0.5060272216796875, -0.47136688232421875, -0.43670654296875, -0.40204620361328125, -0.3673858642578125, -0.33272552490234375, -0.298065185546875, -0.26340484619140625, -0.2287445068359375, -0.19408416748046875, -0.159423828125, -0.12476348876953125, -0.0901031494140625, -0.05544281005859375, -0.020782470703125, 0.01387786865234375, 0.0485382080078125, 0.08319854736328125, 0.11785888671875, 0.15251922607421875, 0.1871795654296875, 0.22183990478515625, 0.256500244140625, 0.29116058349609375, 0.3258209228515625, 0.36048126220703125, 0.3951416015625, 0.42980194091796875, 0.4644622802734375, 0.49912261962890625, 0.533782958984375, 0.5684432983398438, 0.6031036376953125, 0.6377639770507812, 0.67242431640625, 0.7070846557617188, 0.7417449951171875, 0.7764053344726562, 0.811065673828125, 0.8457260131835938, 0.8803863525390625, 0.9150466918945312, 0.94970703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 12.0, 5.0, 12.0, 14.0, 24.0, 27.0, 40.0, 53.0, 59.0, 93.0, 140.0, 221.0, 354.0, 656.0, 1548.0, 5648.0, 61164.0, 922030.0, 48167.0, 5045.0, 1551.0, 638.0, 365.0, 182.0, 128.0, 93.0, 61.0, 56.0, 32.0, 26.0, 25.0, 21.0, 7.0, 8.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6806640625, -1.6304473876953125, -1.580230712890625, -1.5300140380859375, -1.47979736328125, -1.4295806884765625, -1.379364013671875, -1.3291473388671875, -1.2789306640625, -1.2287139892578125, -1.178497314453125, -1.1282806396484375, -1.07806396484375, -1.0278472900390625, -0.977630615234375, -0.9274139404296875, -0.877197265625, -0.8269805908203125, -0.776763916015625, -0.7265472412109375, -0.67633056640625, -0.6261138916015625, -0.575897216796875, -0.5256805419921875, -0.4754638671875, -0.4252471923828125, -0.375030517578125, -0.3248138427734375, -0.27459716796875, -0.2243804931640625, -0.174163818359375, -0.1239471435546875, -0.07373046875, -0.0235137939453125, 0.026702880859375, 0.0769195556640625, 0.12713623046875, 0.1773529052734375, 0.227569580078125, 0.2777862548828125, 0.3280029296875, 0.3782196044921875, 0.428436279296875, 0.4786529541015625, 0.52886962890625, 0.5790863037109375, 0.629302978515625, 0.6795196533203125, 0.729736328125, 0.7799530029296875, 0.830169677734375, 0.8803863525390625, 0.93060302734375, 0.9808197021484375, 1.031036376953125, 1.0812530517578125, 1.1314697265625, 1.1816864013671875, 1.231903076171875, 1.2821197509765625, 1.33233642578125, 1.3825531005859375, 1.432769775390625, 1.4829864501953125, 1.533203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 4.0, 13.0, 10.0, 17.0, 47.0, 84.0, 86.0, 115.0, 171.0, 143.0, 114.0, 70.0, 54.0, 29.0, 24.0, 14.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011461973190307617, -0.0001095188781619072, -0.00010441802442073822, -9.931717067956924e-05, -9.421631693840027e-05, -8.911546319723129e-05, -8.401460945606232e-05, -7.891375571489334e-05, -7.381290197372437e-05, -6.871204823255539e-05, -6.361119449138641e-05, -5.851034075021744e-05, -5.340948700904846e-05, -4.8308633267879486e-05, -4.320777952671051e-05, -3.8106925785541534e-05, -3.300607204437256e-05, -2.7905218303203583e-05, -2.2804364562034607e-05, -1.770351082086563e-05, -1.2602657079696655e-05, -7.5018033385276794e-06, -2.4009495973587036e-06, 2.6999041438102722e-06, 7.800757884979248e-06, 1.2901611626148224e-05, 1.80024653673172e-05, 2.3103319108486176e-05, 2.820417284965515e-05, 3.330502659082413e-05, 3.84058803319931e-05, 4.350673407316208e-05, 4.8607587814331055e-05, 5.370844155550003e-05, 5.8809295296669006e-05, 6.391014903783798e-05, 6.901100277900696e-05, 7.411185652017593e-05, 7.921271026134491e-05, 8.431356400251389e-05, 8.941441774368286e-05, 9.451527148485184e-05, 9.961612522602081e-05, 0.00010471697896718979, 0.00010981783270835876, 0.00011491868644952774, 0.00012001954019069672, 0.0001251203939318657, 0.00013022124767303467, 0.00013532210141420364, 0.00014042295515537262, 0.0001455238088965416, 0.00015062466263771057, 0.00015572551637887955, 0.00016082637012004852, 0.0001659272238612175, 0.00017102807760238647, 0.00017612893134355545, 0.00018122978508472443, 0.0001863306388258934, 0.00019143149256706238, 0.00019653234630823135, 0.00020163320004940033, 0.0002067340537905693, 0.00021183490753173828]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 9.0, 9.0, 16.0, 23.0, 28.0, 47.0, 70.0, 108.0, 238.0, 436.0, 1182.0, 3956.0, 42088.0, 948907.0, 45061.0, 4161.0, 1154.0, 460.0, 253.0, 129.0, 75.0, 44.0, 25.0, 22.0, 15.0, 11.0, 9.0, 5.0, 4.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73828125, -1.681304931640625, -1.62432861328125, -1.567352294921875, -1.5103759765625, -1.453399658203125, -1.39642333984375, -1.339447021484375, -1.282470703125, -1.225494384765625, -1.16851806640625, -1.111541748046875, -1.0545654296875, -0.997589111328125, -0.94061279296875, -0.883636474609375, -0.82666015625, -0.769683837890625, -0.71270751953125, -0.655731201171875, -0.5987548828125, -0.541778564453125, -0.48480224609375, -0.427825927734375, -0.370849609375, -0.313873291015625, -0.25689697265625, -0.199920654296875, -0.1429443359375, -0.085968017578125, -0.02899169921875, 0.027984619140625, 0.0849609375, 0.141937255859375, 0.19891357421875, 0.255889892578125, 0.3128662109375, 0.369842529296875, 0.42681884765625, 0.483795166015625, 0.540771484375, 0.597747802734375, 0.65472412109375, 0.711700439453125, 0.7686767578125, 0.825653076171875, 0.88262939453125, 0.939605712890625, 0.99658203125, 1.053558349609375, 1.11053466796875, 1.167510986328125, 1.2244873046875, 1.281463623046875, 1.33843994140625, 1.395416259765625, 1.452392578125, 1.509368896484375, 1.56634521484375, 1.623321533203125, 1.6802978515625, 1.737274169921875, 1.79425048828125, 1.851226806640625, 1.908203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 22.0, 58.0, 173.0, 296.0, 248.0, 111.0, 37.0, 13.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96875, -2.8922882080078125, -2.815826416015625, -2.7393646240234375, -2.66290283203125, -2.5864410400390625, -2.509979248046875, -2.4335174560546875, -2.3570556640625, -2.2805938720703125, -2.204132080078125, -2.1276702880859375, -2.05120849609375, -1.9747467041015625, -1.898284912109375, -1.8218231201171875, -1.745361328125, -1.6688995361328125, -1.592437744140625, -1.5159759521484375, -1.43951416015625, -1.3630523681640625, -1.286590576171875, -1.2101287841796875, -1.1336669921875, -1.0572052001953125, -0.980743408203125, -0.9042816162109375, -0.82781982421875, -0.7513580322265625, -0.674896240234375, -0.5984344482421875, -0.52197265625, -0.4455108642578125, -0.369049072265625, -0.2925872802734375, -0.21612548828125, -0.1396636962890625, -0.063201904296875, 0.0132598876953125, 0.0897216796875, 0.1661834716796875, 0.242645263671875, 0.3191070556640625, 0.39556884765625, 0.4720306396484375, 0.548492431640625, 0.6249542236328125, 0.701416015625, 0.7778778076171875, 0.854339599609375, 0.9308013916015625, 1.00726318359375, 1.0837249755859375, 1.160186767578125, 1.2366485595703125, 1.3131103515625, 1.3895721435546875, 1.466033935546875, 1.5424957275390625, 1.61895751953125, 1.6954193115234375, 1.771881103515625, 1.8483428955078125, 1.9248046875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 17.0, 20.0, 18.0, 34.0, 44.0, 56.0, 78.0, 83.0, 96.0, 89.0, 72.0, 75.0, 79.0, 68.0, 38.0, 27.0, 24.0, 18.0, 13.0, 13.0, 9.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.188946723937988, -5.946016311645508, -5.703085899353027, -5.460155010223389, -5.217224597930908, -4.974294185638428, -4.731363296508789, -4.488432884216309, -4.245502471923828, -4.002572059631348, -3.759641408920288, -3.5167107582092285, -3.273780345916748, -3.0308499336242676, -2.787919282913208, -2.5449886322021484, -2.302058219909668, -2.0591278076171875, -1.816197156906128, -1.573266625404358, -1.330336093902588, -1.0874055624008179, -0.8444750308990479, -0.6015444993972778, -0.3586139678955078, -0.11568343639373779, 0.12724709510803223, 0.37017762660980225, 0.6131081581115723, 0.8560386896133423, 1.0989692211151123, 1.3418997526168823, 1.5848302841186523, 1.8277608156204224, 2.0706913471221924, 2.313621997833252, 2.5565524101257324, 2.799482822418213, 3.0424134731292725, 3.285344123840332, 3.5282745361328125, 3.771204948425293, 4.014135360717773, 4.257066249847412, 4.499996662139893, 4.742927074432373, 4.985857963562012, 5.228788375854492, 5.471718788146973, 5.714649200439453, 5.957579612731934, 6.200510501861572, 6.443440914154053, 6.686371326446533, 6.929302215576172, 7.172232627868652, 7.415163040161133, 7.658093452453613, 7.901023864746094, 8.143954277038574, 8.386884689331055, 8.629816055297852, 8.872746467590332, 9.115676879882812, 9.358607292175293]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 11.0, 6.0, 7.0, 12.0, 7.0, 14.0, 10.0, 11.0, 15.0, 15.0, 22.0, 19.0, 32.0, 25.0, 34.0, 20.0, 30.0, 34.0, 44.0, 54.0, 49.0, 33.0, 47.0, 34.0, 41.0, 35.0, 40.0, 37.0, 37.0, 22.0, 27.0, 27.0, 25.0, 13.0, 21.0, 19.0, 12.0, 9.0, 8.0, 6.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.115711212158203, -5.9148054122924805, -5.713899612426758, -5.512993812561035, -5.312088489532471, -5.111182689666748, -4.910276889801025, -4.709371089935303, -4.50846529006958, -4.307559490203857, -4.106653690338135, -3.905748128890991, -3.7048423290252686, -3.503936767578125, -3.3030309677124023, -3.1021251678466797, -2.901219606399536, -2.7003138065338135, -2.49940824508667, -2.2985024452209473, -2.0975966453552246, -1.8966909646987915, -1.6957852840423584, -1.4948794841766357, -1.2939738035202026, -1.0930681228637695, -0.8921623229980469, -0.6912566423416138, -0.4903509020805359, -0.289445161819458, -0.0885394811630249, 0.11236631870269775, 0.31327199935913086, 0.5141777396202087, 0.7150834798812866, 0.9159891605377197, 1.1168949604034424, 1.3178006410598755, 1.5187063217163086, 1.7196121215820312, 1.9205178022384644, 2.1214234828948975, 2.32232928276062, 2.5232348442077637, 2.7241406440734863, 2.925046443939209, 3.1259522438049316, 3.3268580436706543, 3.527763605117798, 3.7286694049835205, 3.929574966430664, 4.130480766296387, 4.331386566162109, 4.532292366027832, 4.733198165893555, 4.934103965759277, 5.135009288787842, 5.3359150886535645, 5.536820888519287, 5.737726211547852, 5.938632011413574, 6.139537811279297, 6.3404436111450195, 6.541349411010742, 6.742255210876465]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 5.0, 8.0, 18.0, 20.0, 66.0, 120.0, 332.0, 1494.0, 18217.0, 4154248.0, 17811.0, 1415.0, 320.0, 104.0, 40.0, 26.0, 16.0, 8.0, 2.0, 6.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.86328125, -4.713623046875, -4.56396484375, -4.414306640625, -4.2646484375, -4.114990234375, -3.96533203125, -3.815673828125, -3.666015625, -3.516357421875, -3.36669921875, -3.217041015625, -3.0673828125, -2.917724609375, -2.76806640625, -2.618408203125, -2.46875, -2.319091796875, -2.16943359375, -2.019775390625, -1.8701171875, -1.720458984375, -1.57080078125, -1.421142578125, -1.271484375, -1.121826171875, -0.97216796875, -0.822509765625, -0.6728515625, -0.523193359375, -0.37353515625, -0.223876953125, -0.07421875, 0.075439453125, 0.22509765625, 0.374755859375, 0.5244140625, 0.674072265625, 0.82373046875, 0.973388671875, 1.123046875, 1.272705078125, 1.42236328125, 1.572021484375, 1.7216796875, 1.871337890625, 2.02099609375, 2.170654296875, 2.3203125, 2.469970703125, 2.61962890625, 2.769287109375, 2.9189453125, 3.068603515625, 3.21826171875, 3.367919921875, 3.517578125, 3.667236328125, 3.81689453125, 3.966552734375, 4.1162109375, 4.265869140625, 4.41552734375, 4.565185546875, 4.71484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 3.0, 12.0, 8.0, 10.0, 15.0, 22.0, 20.0, 22.0, 27.0, 39.0, 42.0, 46.0, 57.0, 53.0, 54.0, 57.0, 68.0, 57.0, 54.0, 44.0, 40.0, 60.0, 28.0, 30.0, 31.0, 21.0, 22.0, 6.0, 10.0, 9.0, 15.0, 1.0, 6.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32373046875, -0.3129768371582031, -0.30222320556640625, -0.2914695739746094, -0.2807159423828125, -0.2699623107910156, -0.25920867919921875, -0.24845504760742188, -0.237701416015625, -0.22694778442382812, -0.21619415283203125, -0.20544052124023438, -0.1946868896484375, -0.18393325805664062, -0.17317962646484375, -0.16242599487304688, -0.15167236328125, -0.14091873168945312, -0.13016510009765625, -0.11941146850585938, -0.1086578369140625, -0.09790420532226562, -0.08715057373046875, -0.07639694213867188, -0.065643310546875, -0.054889678955078125, -0.04413604736328125, -0.033382415771484375, -0.0226287841796875, -0.011875152587890625, -0.00112152099609375, 0.009632110595703125, 0.0203857421875, 0.031139373779296875, 0.04189300537109375, 0.052646636962890625, 0.0634002685546875, 0.07415390014648438, 0.08490753173828125, 0.09566116333007812, 0.106414794921875, 0.11716842651367188, 0.12792205810546875, 0.13867568969726562, 0.1494293212890625, 0.16018295288085938, 0.17093658447265625, 0.18169021606445312, 0.19244384765625, 0.20319747924804688, 0.21395111083984375, 0.22470474243164062, 0.2354583740234375, 0.24621200561523438, 0.25696563720703125, 0.2677192687988281, 0.278472900390625, 0.2892265319824219, 0.29998016357421875, 0.3107337951660156, 0.3214874267578125, 0.3322410583496094, 0.34299468994140625, 0.3537483215332031, 0.364501953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 9.0, 11.0, 24.0, 34.0, 46.0, 62.0, 80.0, 93.0, 185.0, 264.0, 412.0, 541.0, 834.0, 1339.0, 2209.0, 3597.0, 7278.0, 16084.0, 47382.0, 324438.0, 3642325.0, 99036.0, 25084.0, 10224.0, 4990.0, 2809.0, 1690.0, 1075.0, 661.0, 460.0, 310.0, 211.0, 153.0, 90.0, 58.0, 51.0, 36.0, 24.0, 21.0, 18.0, 6.0, 11.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8447265625, -0.8167877197265625, -0.788848876953125, -0.7609100341796875, -0.73297119140625, -0.7050323486328125, -0.677093505859375, -0.6491546630859375, -0.6212158203125, -0.5932769775390625, -0.565338134765625, -0.5373992919921875, -0.50946044921875, -0.4815216064453125, -0.453582763671875, -0.4256439208984375, -0.397705078125, -0.3697662353515625, -0.341827392578125, -0.3138885498046875, -0.28594970703125, -0.2580108642578125, -0.230072021484375, -0.2021331787109375, -0.1741943359375, -0.1462554931640625, -0.118316650390625, -0.0903778076171875, -0.06243896484375, -0.0345001220703125, -0.006561279296875, 0.0213775634765625, 0.04931640625, 0.0772552490234375, 0.105194091796875, 0.1331329345703125, 0.16107177734375, 0.1890106201171875, 0.216949462890625, 0.2448883056640625, 0.2728271484375, 0.3007659912109375, 0.328704833984375, 0.3566436767578125, 0.38458251953125, 0.4125213623046875, 0.440460205078125, 0.4683990478515625, 0.496337890625, 0.5242767333984375, 0.552215576171875, 0.5801544189453125, 0.60809326171875, 0.6360321044921875, 0.663970947265625, 0.6919097900390625, 0.7198486328125, 0.7477874755859375, 0.775726318359375, 0.8036651611328125, 0.83160400390625, 0.8595428466796875, 0.887481689453125, 0.9154205322265625, 0.943359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 4.0, 5.0, 13.0, 13.0, 30.0, 52.0, 116.0, 319.0, 3034.0, 250.0, 94.0, 46.0, 25.0, 14.0, 9.0, 18.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.375732421875, -0.364166259765625, -0.35260009765625, -0.341033935546875, -0.3294677734375, -0.317901611328125, -0.30633544921875, -0.294769287109375, -0.283203125, -0.271636962890625, -0.26007080078125, -0.248504638671875, -0.2369384765625, -0.225372314453125, -0.21380615234375, -0.202239990234375, -0.190673828125, -0.179107666015625, -0.16754150390625, -0.155975341796875, -0.1444091796875, -0.132843017578125, -0.12127685546875, -0.109710693359375, -0.09814453125, -0.086578369140625, -0.07501220703125, -0.063446044921875, -0.0518798828125, -0.040313720703125, -0.02874755859375, -0.017181396484375, -0.005615234375, 0.005950927734375, 0.01751708984375, 0.029083251953125, 0.0406494140625, 0.052215576171875, 0.06378173828125, 0.075347900390625, 0.0869140625, 0.098480224609375, 0.11004638671875, 0.121612548828125, 0.1331787109375, 0.144744873046875, 0.15631103515625, 0.167877197265625, 0.179443359375, 0.191009521484375, 0.20257568359375, 0.214141845703125, 0.2257080078125, 0.237274169921875, 0.24884033203125, 0.260406494140625, 0.27197265625, 0.283538818359375, 0.29510498046875, 0.306671142578125, 0.3182373046875, 0.329803466796875, 0.34136962890625, 0.352935791015625, 0.364501953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 15.0, 74.0, 280.0, 433.0, 172.0, 27.0, 9.0, 4.0], "bins": [-9.228479385375977, -9.073238372802734, -8.917998313903809, -8.762757301330566, -8.607516288757324, -8.452276229858398, -8.297035217285156, -8.141794204711914, -7.98655366897583, -7.831313133239746, -7.676072120666504, -7.52083158493042, -7.365591049194336, -7.210350036621094, -7.05510950088501, -6.899868965148926, -6.744627952575684, -6.5893874168396, -6.434146404266357, -6.278905868530273, -6.1236653327941895, -5.968424320220947, -5.813183784484863, -5.657942771911621, -5.502702713012695, -5.347462177276611, -5.192221164703369, -5.036980628967285, -4.881740093231201, -4.726499080657959, -4.571258544921875, -4.416017532348633, -4.260776519775391, -4.105535984039307, -3.9502952098846436, -3.7950544357299805, -3.6398136615753174, -3.4845728874206543, -3.3293323516845703, -3.1740915775299072, -3.0188510417938232, -2.86361026763916, -2.708369731903076, -2.553128957748413, -2.39788818359375, -2.242647647857666, -2.087406873703003, -1.9321660995483398, -1.7769255638122559, -1.6216849088668823, -1.4664441347122192, -1.3112034797668457, -1.1559627056121826, -1.000722050666809, -0.8454813957214355, -0.6902406215667725, -0.5349999070167542, -0.37975919246673584, -0.22451850771903992, -0.069277822971344, 0.08596289157867432, 0.24120360612869263, 0.39644426107406616, 0.5516850352287292, 0.7069256901741028]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 2.0, 8.0, 6.0, 9.0, 9.0, 13.0, 16.0, 15.0, 11.0, 14.0, 33.0, 24.0, 29.0, 22.0, 36.0, 35.0, 29.0, 38.0, 40.0, 37.0, 43.0, 36.0, 36.0, 39.0, 48.0, 42.0, 23.0, 33.0, 36.0, 27.0, 34.0, 22.0, 19.0, 19.0, 22.0, 15.0, 12.0, 19.0, 12.0, 8.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.6587540507316589, -0.6377313137054443, -0.6167086362838745, -0.5956858992576599, -0.5746631622314453, -0.5536404848098755, -0.5326177477836609, -0.5115950107574463, -0.4905723035335541, -0.46954959630966187, -0.44852685928344727, -0.42750415205955505, -0.40648144483566284, -0.38545870780944824, -0.36443600058555603, -0.3434132933616638, -0.3223905563354492, -0.301367849111557, -0.2803451120853424, -0.2593224048614502, -0.2382996827363968, -0.21727696061134338, -0.19625425338745117, -0.17523153126239777, -0.15420880913734436, -0.13318608701229095, -0.11216337233781815, -0.09114065766334534, -0.07011793553829193, -0.049095213413238525, -0.028072506189346313, -0.007049784064292908, 0.013972878456115723, 0.03499559685587883, 0.05601831525564194, 0.07704102993011475, 0.09806375205516815, 0.11908647418022156, 0.14010918140411377, 0.16113190352916718, 0.18215462565422058, 0.203177347779274, 0.2242000699043274, 0.2452227771282196, 0.2662454843521118, 0.2872682213783264, 0.30829092860221863, 0.32931363582611084, 0.35033637285232544, 0.37135908007621765, 0.39238181710243225, 0.41340452432632446, 0.43442726135253906, 0.4554499685764313, 0.4764726758003235, 0.4974954128265381, 0.5185180902481079, 0.5395408272743225, 0.5605635046958923, 0.5815862417221069, 0.6026089787483215, 0.6236317157745361, 0.644654393196106, 0.6656771302223206, 0.6866998672485352]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 4.0, 9.0, 10.0, 6.0, 18.0, 20.0, 17.0, 29.0, 41.0, 61.0, 84.0, 156.0, 220.0, 402.0, 733.0, 1519.0, 3526.0, 9054.0, 25921.0, 81428.0, 239638.0, 376133.0, 206335.0, 67336.0, 21712.0, 7838.0, 3155.0, 1415.0, 681.0, 398.0, 217.0, 125.0, 77.0, 64.0, 52.0, 31.0, 23.0, 10.0, 9.0, 7.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.99609375, -0.9671554565429688, -0.9382171630859375, -0.9092788696289062, -0.880340576171875, -0.8514022827148438, -0.8224639892578125, -0.7935256958007812, -0.76458740234375, -0.7356491088867188, -0.7067108154296875, -0.6777725219726562, -0.648834228515625, -0.6198959350585938, -0.5909576416015625, -0.5620193481445312, -0.5330810546875, -0.5041427612304688, -0.4752044677734375, -0.44626617431640625, -0.417327880859375, -0.38838958740234375, -0.3594512939453125, -0.33051300048828125, -0.30157470703125, -0.27263641357421875, -0.2436981201171875, -0.21475982666015625, -0.185821533203125, -0.15688323974609375, -0.1279449462890625, -0.09900665283203125, -0.070068359375, -0.04113006591796875, -0.0121917724609375, 0.01674652099609375, 0.045684814453125, 0.07462310791015625, 0.1035614013671875, 0.13249969482421875, 0.16143798828125, 0.19037628173828125, 0.2193145751953125, 0.24825286865234375, 0.277191162109375, 0.30612945556640625, 0.3350677490234375, 0.36400604248046875, 0.3929443359375, 0.42188262939453125, 0.4508209228515625, 0.47975921630859375, 0.508697509765625, 0.5376358032226562, 0.5665740966796875, 0.5955123901367188, 0.62445068359375, 0.6533889770507812, 0.6823272705078125, 0.7112655639648438, 0.740203857421875, 0.7691421508789062, 0.7980804443359375, 0.8270187377929688, 0.85595703125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 8.0, 14.0, 19.0, 22.0, 24.0, 22.0, 26.0, 45.0, 39.0, 43.0, 57.0, 51.0, 52.0, 51.0, 54.0, 54.0, 43.0, 37.0, 44.0, 35.0, 44.0, 32.0, 33.0, 32.0, 13.0, 10.0, 10.0, 11.0, 9.0, 9.0, 5.0, 4.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3359375, -0.32544708251953125, -0.3149566650390625, -0.30446624755859375, -0.293975830078125, -0.28348541259765625, -0.2729949951171875, -0.26250457763671875, -0.25201416015625, -0.24152374267578125, -0.2310333251953125, -0.22054290771484375, -0.210052490234375, -0.19956207275390625, -0.1890716552734375, -0.17858123779296875, -0.1680908203125, -0.15760040283203125, -0.1471099853515625, -0.13661956787109375, -0.126129150390625, -0.11563873291015625, -0.1051483154296875, -0.09465789794921875, -0.08416748046875, -0.07367706298828125, -0.0631866455078125, -0.05269622802734375, -0.042205810546875, -0.03171539306640625, -0.0212249755859375, -0.01073455810546875, -0.000244140625, 0.01024627685546875, 0.0207366943359375, 0.03122711181640625, 0.041717529296875, 0.05220794677734375, 0.0626983642578125, 0.07318878173828125, 0.08367919921875, 0.09416961669921875, 0.1046600341796875, 0.11515045166015625, 0.125640869140625, 0.13613128662109375, 0.1466217041015625, 0.15711212158203125, 0.1676025390625, 0.17809295654296875, 0.1885833740234375, 0.19907379150390625, 0.209564208984375, 0.22005462646484375, 0.2305450439453125, 0.24103546142578125, 0.25152587890625, 0.26201629638671875, 0.2725067138671875, 0.28299713134765625, 0.293487548828125, 0.30397796630859375, 0.3144683837890625, 0.32495880126953125, 0.33544921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 9.0, 18.0, 15.0, 31.0, 26.0, 45.0, 76.0, 91.0, 184.0, 257.0, 459.0, 808.0, 1749.0, 3962.0, 11173.0, 44029.0, 266752.0, 562989.0, 120254.0, 23109.0, 6898.0, 2714.0, 1290.0, 620.0, 376.0, 222.0, 136.0, 83.0, 51.0, 43.0, 22.0, 24.0, 9.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.306640625, -1.2648773193359375, -1.223114013671875, -1.1813507080078125, -1.13958740234375, -1.0978240966796875, -1.056060791015625, -1.0142974853515625, -0.9725341796875, -0.9307708740234375, -0.889007568359375, -0.8472442626953125, -0.80548095703125, -0.7637176513671875, -0.721954345703125, -0.6801910400390625, -0.638427734375, -0.5966644287109375, -0.554901123046875, -0.5131378173828125, -0.47137451171875, -0.4296112060546875, -0.387847900390625, -0.3460845947265625, -0.3043212890625, -0.2625579833984375, -0.220794677734375, -0.1790313720703125, -0.13726806640625, -0.0955047607421875, -0.053741455078125, -0.0119781494140625, 0.02978515625, 0.0715484619140625, 0.113311767578125, 0.1550750732421875, 0.19683837890625, 0.2386016845703125, 0.280364990234375, 0.3221282958984375, 0.3638916015625, 0.4056549072265625, 0.447418212890625, 0.4891815185546875, 0.53094482421875, 0.5727081298828125, 0.614471435546875, 0.6562347412109375, 0.697998046875, 0.7397613525390625, 0.781524658203125, 0.8232879638671875, 0.86505126953125, 0.9068145751953125, 0.948577880859375, 0.9903411865234375, 1.0321044921875, 1.0738677978515625, 1.115631103515625, 1.1573944091796875, 1.19915771484375, 1.2409210205078125, 1.282684326171875, 1.3244476318359375, 1.3662109375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 5.0, 14.0, 19.0, 20.0, 30.0, 28.0, 34.0, 40.0, 44.0, 40.0, 59.0, 45.0, 63.0, 54.0, 61.0, 65.0, 43.0, 49.0, 49.0, 30.0, 39.0, 32.0, 27.0, 19.0, 15.0, 16.0, 6.0, 10.0, 11.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.441497802734375, -1.38787841796875, -1.334259033203125, -1.2806396484375, -1.227020263671875, -1.17340087890625, -1.119781494140625, -1.066162109375, -1.012542724609375, -0.95892333984375, -0.905303955078125, -0.8516845703125, -0.798065185546875, -0.74444580078125, -0.690826416015625, -0.63720703125, -0.583587646484375, -0.52996826171875, -0.476348876953125, -0.4227294921875, -0.369110107421875, -0.31549072265625, -0.261871337890625, -0.208251953125, -0.154632568359375, -0.10101318359375, -0.047393798828125, 0.0062255859375, 0.059844970703125, 0.11346435546875, 0.167083740234375, 0.220703125, 0.274322509765625, 0.32794189453125, 0.381561279296875, 0.4351806640625, 0.488800048828125, 0.54241943359375, 0.596038818359375, 0.649658203125, 0.703277587890625, 0.75689697265625, 0.810516357421875, 0.8641357421875, 0.917755126953125, 0.97137451171875, 1.024993896484375, 1.07861328125, 1.132232666015625, 1.18585205078125, 1.239471435546875, 1.2930908203125, 1.346710205078125, 1.40032958984375, 1.453948974609375, 1.507568359375, 1.561187744140625, 1.61480712890625, 1.668426513671875, 1.7220458984375, 1.775665283203125, 1.82928466796875, 1.882904052734375, 1.9365234375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 10.0, 6.0, 39.0, 71.0, 146.0, 342.0, 944.0, 3860.0, 72160.0, 948272.0, 19481.0, 2055.0, 649.0, 264.0, 134.0, 52.0, 34.0, 11.0, 8.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.29730224609375, -2.2215576171875, -2.14581298828125, -2.070068359375, -1.99432373046875, -1.9185791015625, -1.84283447265625, -1.76708984375, -1.69134521484375, -1.6156005859375, -1.53985595703125, -1.464111328125, -1.38836669921875, -1.3126220703125, -1.23687744140625, -1.1611328125, -1.08538818359375, -1.0096435546875, -0.93389892578125, -0.858154296875, -0.78240966796875, -0.7066650390625, -0.63092041015625, -0.55517578125, -0.47943115234375, -0.4036865234375, -0.32794189453125, -0.252197265625, -0.17645263671875, -0.1007080078125, -0.02496337890625, 0.05078125, 0.12652587890625, 0.2022705078125, 0.27801513671875, 0.353759765625, 0.42950439453125, 0.5052490234375, 0.58099365234375, 0.65673828125, 0.73248291015625, 0.8082275390625, 0.88397216796875, 0.959716796875, 1.03546142578125, 1.1112060546875, 1.18695068359375, 1.2626953125, 1.33843994140625, 1.4141845703125, 1.48992919921875, 1.565673828125, 1.64141845703125, 1.7171630859375, 1.79290771484375, 1.86865234375, 1.94439697265625, 2.0201416015625, 2.09588623046875, 2.171630859375, 2.24737548828125, 2.3231201171875, 2.39886474609375, 2.474609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 13.0, 18.0, 38.0, 76.0, 160.0, 193.0, 211.0, 149.0, 78.0, 42.0, 18.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003209114074707031, -0.0003134477883577347, -0.00030598416924476624, -0.0002985205501317978, -0.00029105693101882935, -0.0002835933119058609, -0.00027612969279289246, -0.000268666073679924, -0.00026120245456695557, -0.0002537388354539871, -0.0002462752163410187, -0.00023881159722805023, -0.0002313479781150818, -0.00022388435900211334, -0.0002164207398891449, -0.00020895712077617645, -0.000201493501663208, -0.00019402988255023956, -0.00018656626343727112, -0.00017910264432430267, -0.00017163902521133423, -0.00016417540609836578, -0.00015671178698539734, -0.0001492481678724289, -0.00014178454875946045, -0.000134320929646492, -0.00012685731053352356, -0.00011939369142055511, -0.00011193007230758667, -0.00010446645319461823, -9.700283408164978e-05, -8.953921496868134e-05, -8.207559585571289e-05, -7.461197674274445e-05, -6.7148357629776e-05, -5.9684738516807556e-05, -5.222111940383911e-05, -4.4757500290870667e-05, -3.729388117790222e-05, -2.9830262064933777e-05, -2.2366642951965332e-05, -1.4903023838996887e-05, -7.439404726028442e-06, 2.421438694000244e-08, 7.487833499908447e-06, 1.4951452612876892e-05, 2.2415071725845337e-05, 2.9878690838813782e-05, 3.7342309951782227e-05, 4.480592906475067e-05, 5.2269548177719116e-05, 5.973316729068756e-05, 6.7196786403656e-05, 7.466040551662445e-05, 8.21240246295929e-05, 8.958764374256134e-05, 9.705126285552979e-05, 0.00010451488196849823, 0.00011197850108146667, 0.00011944212019443512, 0.00012690573930740356, 0.000134369358420372, 0.00014183297753334045, 0.0001492965966463089, 0.00015676021575927734]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 9.0, 17.0, 27.0, 40.0, 73.0, 159.0, 341.0, 925.0, 4243.0, 55987.0, 947725.0, 34236.0, 3315.0, 806.0, 319.0, 135.0, 88.0, 43.0, 14.0, 21.0, 12.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.065032958984375, -2.00506591796875, -1.945098876953125, -1.8851318359375, -1.825164794921875, -1.76519775390625, -1.705230712890625, -1.645263671875, -1.585296630859375, -1.52532958984375, -1.465362548828125, -1.4053955078125, -1.345428466796875, -1.28546142578125, -1.225494384765625, -1.16552734375, -1.105560302734375, -1.04559326171875, -0.985626220703125, -0.9256591796875, -0.865692138671875, -0.80572509765625, -0.745758056640625, -0.685791015625, -0.625823974609375, -0.56585693359375, -0.505889892578125, -0.4459228515625, -0.385955810546875, -0.32598876953125, -0.266021728515625, -0.2060546875, -0.146087646484375, -0.08612060546875, -0.026153564453125, 0.0338134765625, 0.093780517578125, 0.15374755859375, 0.213714599609375, 0.273681640625, 0.333648681640625, 0.39361572265625, 0.453582763671875, 0.5135498046875, 0.573516845703125, 0.63348388671875, 0.693450927734375, 0.75341796875, 0.813385009765625, 0.87335205078125, 0.933319091796875, 0.9932861328125, 1.053253173828125, 1.11322021484375, 1.173187255859375, 1.233154296875, 1.293121337890625, 1.35308837890625, 1.413055419921875, 1.4730224609375, 1.532989501953125, 1.59295654296875, 1.652923583984375, 1.712890625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 2.0, 5.0, 11.0, 12.0, 16.0, 24.0, 42.0, 74.0, 109.0, 124.0, 163.0, 159.0, 108.0, 57.0, 37.0, 21.0, 7.0, 7.0, 11.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.86328125, -1.8203811645507812, -1.7774810791015625, -1.7345809936523438, -1.691680908203125, -1.6487808227539062, -1.6058807373046875, -1.5629806518554688, -1.52008056640625, -1.4771804809570312, -1.4342803955078125, -1.3913803100585938, -1.348480224609375, -1.3055801391601562, -1.2626800537109375, -1.2197799682617188, -1.1768798828125, -1.1339797973632812, -1.0910797119140625, -1.0481796264648438, -1.005279541015625, -0.9623794555664062, -0.9194793701171875, -0.8765792846679688, -0.83367919921875, -0.7907791137695312, -0.7478790283203125, -0.7049789428710938, -0.662078857421875, -0.6191787719726562, -0.5762786865234375, -0.5333786010742188, -0.490478515625, -0.44757843017578125, -0.4046783447265625, -0.36177825927734375, -0.318878173828125, -0.27597808837890625, -0.2330780029296875, -0.19017791748046875, -0.14727783203125, -0.10437774658203125, -0.0614776611328125, -0.01857757568359375, 0.024322509765625, 0.06722259521484375, 0.1101226806640625, 0.15302276611328125, 0.1959228515625, 0.23882293701171875, 0.2817230224609375, 0.32462310791015625, 0.367523193359375, 0.41042327880859375, 0.4533233642578125, 0.49622344970703125, 0.53912353515625, 0.5820236206054688, 0.6249237060546875, 0.6678237915039062, 0.710723876953125, 0.7536239624023438, 0.7965240478515625, 0.8394241333007812, 0.88232421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 9.0, 9.0, 18.0, 21.0, 37.0, 46.0, 66.0, 89.0, 105.0, 116.0, 130.0, 88.0, 87.0, 53.0, 41.0, 25.0, 18.0, 14.0, 7.0, 3.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.19670581817627, -12.809350967407227, -12.421996116638184, -12.03464126586914, -11.647287368774414, -11.259932518005371, -10.872577667236328, -10.485222816467285, -10.097867965698242, -9.7105131149292, -9.323158264160156, -8.935803413391113, -8.54844856262207, -8.161094665527344, -7.773739814758301, -7.386384963989258, -6.999030113220215, -6.611675262451172, -6.224320411682129, -5.836966037750244, -5.449611186981201, -5.062256336212158, -4.674901962280273, -4.2875471115112305, -3.9001922607421875, -3.5128374099731445, -3.1254827976226807, -2.738128185272217, -2.350773334503174, -1.9634186029434204, -1.576063871383667, -1.1887092590332031, -0.8013553619384766, -0.41400063037872314, -0.026645898818969727, 0.3607088327407837, 0.7480635643005371, 1.1354182958602905, 1.522773027420044, 1.9101276397705078, 2.297482490539551, 2.6848373413085938, 3.0721919536590576, 3.4595465660095215, 3.8469014167785645, 4.234256267547607, 4.621610641479492, 5.008965492248535, 5.396320343017578, 5.783675193786621, 6.171030044555664, 6.558384418487549, 6.945739269256592, 7.333094120025635, 7.7204484939575195, 8.107803344726562, 8.495158195495605, 8.882513046264648, 9.269867897033691, 9.657222747802734, 10.044576644897461, 10.431931495666504, 10.819286346435547, 11.20664119720459, 11.593996047973633]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 6.0, 6.0, 10.0, 6.0, 15.0, 12.0, 19.0, 16.0, 24.0, 35.0, 18.0, 34.0, 27.0, 42.0, 29.0, 49.0, 47.0, 51.0, 42.0, 43.0, 47.0, 43.0, 43.0, 41.0, 39.0, 29.0, 28.0, 33.0, 27.0, 18.0, 22.0, 24.0, 14.0, 7.0, 8.0, 5.0, 7.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.183813095092773, -6.948230743408203, -6.712648391723633, -6.4770660400390625, -6.241483688354492, -6.005901336669922, -5.770318984985352, -5.534736633300781, -5.299154281616211, -5.063571929931641, -4.82798957824707, -4.5924072265625, -4.35682487487793, -4.121242523193359, -3.88565993309021, -3.6500775814056396, -3.4144949913024902, -3.17891263961792, -2.9433302879333496, -2.7077479362487793, -2.472165584564209, -2.2365832328796387, -2.0010006427764893, -1.765418291091919, -1.5298359394073486, -1.2942535877227783, -1.058671236038208, -0.8230887651443481, -0.5875064134597778, -0.3519240617752075, -0.11634159088134766, 0.11924076080322266, 0.35482358932495117, 0.5904059410095215, 0.8259883522987366, 1.0615707635879517, 1.297153115272522, 1.5327354669570923, 1.7683179378509521, 2.0039002895355225, 2.2394826412200928, 2.475064992904663, 2.7106473445892334, 2.946229934692383, 3.181812286376953, 3.4173946380615234, 3.6529769897460938, 3.888559341430664, 4.124141693115234, 4.359724044799805, 4.595306396484375, 4.830888748168945, 5.066471099853516, 5.302053451538086, 5.537635803222656, 5.773218154907227, 6.008800506591797, 6.244382858276367, 6.4799652099609375, 6.715547561645508, 6.951129913330078, 7.186712265014648, 7.422294616699219, 7.657876968383789, 7.893459796905518]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 9.0, 7.0, 10.0, 10.0, 20.0, 41.0, 85.0, 141.0, 249.0, 628.0, 2472.0, 25277.0, 4145818.0, 16380.0, 2017.0, 570.0, 225.0, 128.0, 79.0, 47.0, 20.0, 11.0, 18.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.24609375, -4.1065673828125, -3.967041015625, -3.8275146484375, -3.68798828125, -3.5484619140625, -3.408935546875, -3.2694091796875, -3.1298828125, -2.9903564453125, -2.850830078125, -2.7113037109375, -2.57177734375, -2.4322509765625, -2.292724609375, -2.1531982421875, -2.013671875, -1.8741455078125, -1.734619140625, -1.5950927734375, -1.45556640625, -1.3160400390625, -1.176513671875, -1.0369873046875, -0.8974609375, -0.7579345703125, -0.618408203125, -0.4788818359375, -0.33935546875, -0.1998291015625, -0.060302734375, 0.0792236328125, 0.21875, 0.3582763671875, 0.497802734375, 0.6373291015625, 0.77685546875, 0.9163818359375, 1.055908203125, 1.1954345703125, 1.3349609375, 1.4744873046875, 1.614013671875, 1.7535400390625, 1.89306640625, 2.0325927734375, 2.172119140625, 2.3116455078125, 2.451171875, 2.5906982421875, 2.730224609375, 2.8697509765625, 3.00927734375, 3.1488037109375, 3.288330078125, 3.4278564453125, 3.5673828125, 3.7069091796875, 3.846435546875, 3.9859619140625, 4.12548828125, 4.2650146484375, 4.404541015625, 4.5440673828125, 4.68359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 8.0, 7.0, 14.0, 18.0, 17.0, 14.0, 24.0, 35.0, 38.0, 39.0, 35.0, 40.0, 40.0, 44.0, 55.0, 51.0, 49.0, 57.0, 57.0, 42.0, 45.0, 33.0, 32.0, 31.0, 29.0, 25.0, 18.0, 22.0, 15.0, 12.0, 5.0, 10.0, 7.0, 7.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.343994140625, -0.3327140808105469, -0.32143402099609375, -0.3101539611816406, -0.2988739013671875, -0.2875938415527344, -0.27631378173828125, -0.2650337219238281, -0.253753662109375, -0.24247360229492188, -0.23119354248046875, -0.21991348266601562, -0.2086334228515625, -0.19735336303710938, -0.18607330322265625, -0.17479324340820312, -0.16351318359375, -0.15223312377929688, -0.14095306396484375, -0.12967300415039062, -0.1183929443359375, -0.10711288452148438, -0.09583282470703125, -0.08455276489257812, -0.073272705078125, -0.061992645263671875, -0.05071258544921875, -0.039432525634765625, -0.0281524658203125, -0.016872406005859375, -0.00559234619140625, 0.005687713623046875, 0.0169677734375, 0.028247833251953125, 0.03952789306640625, 0.050807952880859375, 0.0620880126953125, 0.07336807250976562, 0.08464813232421875, 0.09592819213867188, 0.107208251953125, 0.11848831176757812, 0.12976837158203125, 0.14104843139648438, 0.1523284912109375, 0.16360855102539062, 0.17488861083984375, 0.18616867065429688, 0.19744873046875, 0.20872879028320312, 0.22000885009765625, 0.23128890991210938, 0.2425689697265625, 0.2538490295410156, 0.26512908935546875, 0.2764091491699219, 0.287689208984375, 0.2989692687988281, 0.31024932861328125, 0.3215293884277344, 0.3328094482421875, 0.3440895080566406, 0.35536956787109375, 0.3666496276855469, 0.3779296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 12.0, 13.0, 32.0, 34.0, 47.0, 52.0, 132.0, 153.0, 245.0, 411.0, 735.0, 1429.0, 3799.0, 15956.0, 307409.0, 3835657.0, 20162.0, 4373.0, 1617.0, 785.0, 429.0, 241.0, 177.0, 118.0, 98.0, 51.0, 33.0, 20.0, 8.0, 16.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.358306884765625, -2.27716064453125, -2.196014404296875, -2.1148681640625, -2.033721923828125, -1.95257568359375, -1.871429443359375, -1.790283203125, -1.709136962890625, -1.62799072265625, -1.546844482421875, -1.4656982421875, -1.384552001953125, -1.30340576171875, -1.222259521484375, -1.14111328125, -1.059967041015625, -0.97882080078125, -0.897674560546875, -0.8165283203125, -0.735382080078125, -0.65423583984375, -0.573089599609375, -0.491943359375, -0.410797119140625, -0.32965087890625, -0.248504638671875, -0.1673583984375, -0.086212158203125, -0.00506591796875, 0.076080322265625, 0.1572265625, 0.238372802734375, 0.31951904296875, 0.400665283203125, 0.4818115234375, 0.562957763671875, 0.64410400390625, 0.725250244140625, 0.806396484375, 0.887542724609375, 0.96868896484375, 1.049835205078125, 1.1309814453125, 1.212127685546875, 1.29327392578125, 1.374420166015625, 1.45556640625, 1.536712646484375, 1.61785888671875, 1.699005126953125, 1.7801513671875, 1.861297607421875, 1.94244384765625, 2.023590087890625, 2.104736328125, 2.185882568359375, 2.26702880859375, 2.348175048828125, 2.4293212890625, 2.510467529296875, 2.59161376953125, 2.672760009765625, 2.75390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 15.0, 18.0, 41.0, 94.0, 2972.0, 764.0, 76.0, 31.0, 20.0, 9.0, 11.0, 8.0, 8.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.78839111328125, -0.7686767578125, -0.74896240234375, -0.729248046875, -0.70953369140625, -0.6898193359375, -0.67010498046875, -0.650390625, -0.63067626953125, -0.6109619140625, -0.59124755859375, -0.571533203125, -0.55181884765625, -0.5321044921875, -0.51239013671875, -0.49267578125, -0.47296142578125, -0.4532470703125, -0.43353271484375, -0.413818359375, -0.39410400390625, -0.3743896484375, -0.35467529296875, -0.3349609375, -0.31524658203125, -0.2955322265625, -0.27581787109375, -0.256103515625, -0.23638916015625, -0.2166748046875, -0.19696044921875, -0.17724609375, -0.15753173828125, -0.1378173828125, -0.11810302734375, -0.098388671875, -0.07867431640625, -0.0589599609375, -0.03924560546875, -0.01953125, 0.00018310546875, 0.0198974609375, 0.03961181640625, 0.059326171875, 0.07904052734375, 0.0987548828125, 0.11846923828125, 0.13818359375, 0.15789794921875, 0.1776123046875, 0.19732666015625, 0.217041015625, 0.23675537109375, 0.2564697265625, 0.27618408203125, 0.2958984375, 0.31561279296875, 0.3353271484375, 0.35504150390625, 0.374755859375, 0.39447021484375, 0.4141845703125, 0.43389892578125, 0.45361328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 18.0, 19.0, 30.0, 48.0, 82.0, 106.0, 115.0, 124.0, 122.0, 89.0, 75.0, 59.0, 41.0, 24.0, 13.0, 12.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.144212484359741, -2.0932729244232178, -2.0423333644866943, -1.9913936853408813, -1.940454125404358, -1.8895145654678345, -1.838575005531311, -1.787635326385498, -1.7366957664489746, -1.6857562065124512, -1.6348166465759277, -1.5838769674301147, -1.5329374074935913, -1.4819978475570679, -1.4310582876205444, -1.3801186084747314, -1.329179048538208, -1.2782394886016846, -1.2272999286651611, -1.1763602495193481, -1.1254206895828247, -1.0744811296463013, -1.0235415697097778, -0.9726019501686096, -0.921662449836731, -0.8707228899002075, -0.8197832703590393, -0.7688437104225159, -0.7179040908813477, -0.6669645309448242, -0.6160249710083008, -0.5650853514671326, -0.5141457319259644, -0.46320614218711853, -0.4122665524482727, -0.36132699251174927, -0.31038737297058105, -0.2594478130340576, -0.2085082232952118, -0.15756863355636597, -0.10662904381752014, -0.055689457803964615, -0.004749871790409088, 0.04618971049785614, 0.09712930023670197, 0.1480688750743866, 0.19900846481323242, 0.24994805455207825, 0.3008876442909241, 0.3518272340297699, 0.4027668237686157, 0.45370638370513916, 0.5046460032463074, 0.5555855631828308, 0.606525182723999, 0.6574647426605225, 0.7084043025970459, 0.7593438625335693, 0.8102834820747375, 0.861223042011261, 0.9121626615524292, 0.9631022214889526, 1.014041781425476, 1.064981460571289, 1.1159210205078125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 0.0, 4.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 13.0, 20.0, 24.0, 23.0, 25.0, 22.0, 29.0, 33.0, 31.0, 39.0, 38.0, 46.0, 44.0, 44.0, 45.0, 54.0, 38.0, 44.0, 36.0, 36.0, 34.0, 29.0, 32.0, 29.0, 17.0, 11.0, 19.0, 20.0, 13.0, 26.0, 11.0, 9.0, 6.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.8593247532844543, -0.8347761034965515, -0.8102275133132935, -0.7856788635253906, -0.7611302137374878, -0.7365816235542297, -0.7120329737663269, -0.6874843835830688, -0.662935733795166, -0.6383870840072632, -0.6138384938240051, -0.5892898440361023, -0.5647412538528442, -0.5401926040649414, -0.5156439542770386, -0.49109533429145813, -0.4665467143058777, -0.44199809432029724, -0.4174494743347168, -0.39290082454681396, -0.3683522045612335, -0.3438035845756531, -0.31925493478775024, -0.2947063148021698, -0.27015769481658936, -0.2456090748310089, -0.22106043994426727, -0.19651180505752563, -0.1719631850719452, -0.14741456508636475, -0.12286593019962311, -0.09831729531288147, -0.07376861572265625, -0.04921998828649521, -0.024671360850334167, -0.00012273341417312622, 0.024425894021987915, 0.048974521458148956, 0.07352314889431, 0.09807178378105164, 0.12262040376663208, 0.14716902375221252, 0.17171765863895416, 0.1962662935256958, 0.22081491351127625, 0.2453635334968567, 0.2699121832847595, 0.29446080327033997, 0.3190094232559204, 0.34355804324150085, 0.3681066632270813, 0.39265531301498413, 0.4172039330005646, 0.441752552986145, 0.46630120277404785, 0.4908498227596283, 0.5153984427452087, 0.5399470925331116, 0.5644956827163696, 0.5890443325042725, 0.6135929822921753, 0.6381415724754333, 0.6626902222633362, 0.6872388124465942, 0.7117874622344971]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 6.0, 12.0, 9.0, 10.0, 20.0, 24.0, 25.0, 46.0, 49.0, 73.0, 97.0, 144.0, 250.0, 354.0, 561.0, 1043.0, 1829.0, 3875.0, 9421.0, 27491.0, 93302.0, 294836.0, 389129.0, 155724.0, 44975.0, 14076.0, 5415.0, 2492.0, 1260.0, 673.0, 418.0, 270.0, 170.0, 145.0, 93.0, 69.0, 37.0, 33.0, 24.0, 22.0, 15.0, 13.0, 8.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88720703125, -0.8557510375976562, -0.8242950439453125, -0.7928390502929688, -0.761383056640625, -0.7299270629882812, -0.6984710693359375, -0.6670150756835938, -0.63555908203125, -0.6041030883789062, -0.5726470947265625, -0.5411911010742188, -0.509735107421875, -0.47827911376953125, -0.4468231201171875, -0.41536712646484375, -0.3839111328125, -0.35245513916015625, -0.3209991455078125, -0.28954315185546875, -0.258087158203125, -0.22663116455078125, -0.1951751708984375, -0.16371917724609375, -0.13226318359375, -0.10080718994140625, -0.0693511962890625, -0.03789520263671875, -0.006439208984375, 0.02501678466796875, 0.0564727783203125, 0.08792877197265625, 0.119384765625, 0.15084075927734375, 0.1822967529296875, 0.21375274658203125, 0.245208740234375, 0.27666473388671875, 0.3081207275390625, 0.33957672119140625, 0.37103271484375, 0.40248870849609375, 0.4339447021484375, 0.46540069580078125, 0.496856689453125, 0.5283126831054688, 0.5597686767578125, 0.5912246704101562, 0.6226806640625, 0.6541366577148438, 0.6855926513671875, 0.7170486450195312, 0.748504638671875, 0.7799606323242188, 0.8114166259765625, 0.8428726196289062, 0.87432861328125, 0.9057846069335938, 0.9372406005859375, 0.9686965942382812, 1.000152587890625, 1.0316085815429688, 1.0630645751953125, 1.0945205688476562, 1.1259765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 6.0, 7.0, 10.0, 9.0, 11.0, 20.0, 22.0, 25.0, 25.0, 29.0, 37.0, 30.0, 33.0, 43.0, 39.0, 51.0, 40.0, 62.0, 44.0, 51.0, 41.0, 50.0, 47.0, 31.0, 29.0, 25.0, 35.0, 25.0, 15.0, 15.0, 16.0, 12.0, 7.0, 8.0, 10.0, 5.0, 6.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3427734375, -0.3313484191894531, -0.31992340087890625, -0.3084983825683594, -0.2970733642578125, -0.2856483459472656, -0.27422332763671875, -0.2627983093261719, -0.251373291015625, -0.23994827270507812, -0.22852325439453125, -0.21709823608398438, -0.2056732177734375, -0.19424819946289062, -0.18282318115234375, -0.17139816284179688, -0.15997314453125, -0.14854812622070312, -0.13712310791015625, -0.12569808959960938, -0.1142730712890625, -0.10284805297851562, -0.09142303466796875, -0.07999801635742188, -0.068572998046875, -0.057147979736328125, -0.04572296142578125, -0.034297943115234375, -0.0228729248046875, -0.011447906494140625, -2.288818359375e-05, 0.011402130126953125, 0.0228271484375, 0.034252166748046875, 0.04567718505859375, 0.057102203369140625, 0.0685272216796875, 0.07995223999023438, 0.09137725830078125, 0.10280227661132812, 0.114227294921875, 0.12565231323242188, 0.13707733154296875, 0.14850234985351562, 0.1599273681640625, 0.17135238647460938, 0.18277740478515625, 0.19420242309570312, 0.20562744140625, 0.21705245971679688, 0.22847747802734375, 0.23990249633789062, 0.2513275146484375, 0.2627525329589844, 0.27417755126953125, 0.2856025695800781, 0.297027587890625, 0.3084526062011719, 0.31987762451171875, 0.3313026428222656, 0.3427276611328125, 0.3541526794433594, 0.36557769775390625, 0.3770027160644531, 0.388427734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 6.0, 5.0, 17.0, 18.0, 21.0, 33.0, 42.0, 64.0, 93.0, 135.0, 182.0, 299.0, 468.0, 778.0, 1337.0, 2629.0, 5981.0, 18485.0, 82802.0, 400384.0, 416557.0, 86633.0, 19166.0, 6062.0, 2755.0, 1383.0, 738.0, 479.0, 329.0, 209.0, 128.0, 110.0, 65.0, 37.0, 32.0, 23.0, 20.0, 13.0, 10.0, 8.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.04296875, -1.0057373046875, -0.968505859375, -0.9312744140625, -0.89404296875, -0.8568115234375, -0.819580078125, -0.7823486328125, -0.7451171875, -0.7078857421875, -0.670654296875, -0.6334228515625, -0.59619140625, -0.5589599609375, -0.521728515625, -0.4844970703125, -0.447265625, -0.4100341796875, -0.372802734375, -0.3355712890625, -0.29833984375, -0.2611083984375, -0.223876953125, -0.1866455078125, -0.1494140625, -0.1121826171875, -0.074951171875, -0.0377197265625, -0.00048828125, 0.0367431640625, 0.073974609375, 0.1112060546875, 0.1484375, 0.1856689453125, 0.222900390625, 0.2601318359375, 0.29736328125, 0.3345947265625, 0.371826171875, 0.4090576171875, 0.4462890625, 0.4835205078125, 0.520751953125, 0.5579833984375, 0.59521484375, 0.6324462890625, 0.669677734375, 0.7069091796875, 0.744140625, 0.7813720703125, 0.818603515625, 0.8558349609375, 0.89306640625, 0.9302978515625, 0.967529296875, 1.0047607421875, 1.0419921875, 1.0792236328125, 1.116455078125, 1.1536865234375, 1.19091796875, 1.2281494140625, 1.265380859375, 1.3026123046875, 1.33984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 5.0, 9.0, 6.0, 15.0, 14.0, 14.0, 19.0, 25.0, 17.0, 31.0, 20.0, 27.0, 36.0, 39.0, 35.0, 37.0, 59.0, 43.0, 40.0, 54.0, 40.0, 44.0, 42.0, 35.0, 40.0, 25.0, 35.0, 30.0, 28.0, 20.0, 17.0, 22.0, 14.0, 15.0, 9.0, 6.0, 6.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.646484375, -1.5935821533203125, -1.540679931640625, -1.4877777099609375, -1.43487548828125, -1.3819732666015625, -1.329071044921875, -1.2761688232421875, -1.2232666015625, -1.1703643798828125, -1.117462158203125, -1.0645599365234375, -1.01165771484375, -0.9587554931640625, -0.905853271484375, -0.8529510498046875, -0.800048828125, -0.7471466064453125, -0.694244384765625, -0.6413421630859375, -0.58843994140625, -0.5355377197265625, -0.482635498046875, -0.4297332763671875, -0.3768310546875, -0.3239288330078125, -0.271026611328125, -0.2181243896484375, -0.16522216796875, -0.1123199462890625, -0.059417724609375, -0.0065155029296875, 0.04638671875, 0.0992889404296875, 0.152191162109375, 0.2050933837890625, 0.25799560546875, 0.3108978271484375, 0.363800048828125, 0.4167022705078125, 0.4696044921875, 0.5225067138671875, 0.575408935546875, 0.6283111572265625, 0.68121337890625, 0.7341156005859375, 0.787017822265625, 0.8399200439453125, 0.892822265625, 0.9457244873046875, 0.998626708984375, 1.0515289306640625, 1.10443115234375, 1.1573333740234375, 1.210235595703125, 1.2631378173828125, 1.3160400390625, 1.3689422607421875, 1.421844482421875, 1.4747467041015625, 1.52764892578125, 1.5805511474609375, 1.633453369140625, 1.6863555908203125, 1.7392578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 12.0, 17.0, 24.0, 39.0, 98.0, 159.0, 351.0, 1131.0, 6785.0, 515700.0, 515519.0, 6939.0, 1116.0, 344.0, 146.0, 73.0, 33.0, 21.0, 17.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58203125, -1.51611328125, -1.4501953125, -1.38427734375, -1.318359375, -1.25244140625, -1.1865234375, -1.12060546875, -1.0546875, -0.98876953125, -0.9228515625, -0.85693359375, -0.791015625, -0.72509765625, -0.6591796875, -0.59326171875, -0.52734375, -0.46142578125, -0.3955078125, -0.32958984375, -0.263671875, -0.19775390625, -0.1318359375, -0.06591796875, 0.0, 0.06591796875, 0.1318359375, 0.19775390625, 0.263671875, 0.32958984375, 0.3955078125, 0.46142578125, 0.52734375, 0.59326171875, 0.6591796875, 0.72509765625, 0.791015625, 0.85693359375, 0.9228515625, 0.98876953125, 1.0546875, 1.12060546875, 1.1865234375, 1.25244140625, 1.318359375, 1.38427734375, 1.4501953125, 1.51611328125, 1.58203125, 1.64794921875, 1.7138671875, 1.77978515625, 1.845703125, 1.91162109375, 1.9775390625, 2.04345703125, 2.109375, 2.17529296875, 2.2412109375, 2.30712890625, 2.373046875, 2.43896484375, 2.5048828125, 2.57080078125, 2.63671875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 8.0, 7.0, 8.0, 17.0, 14.0, 17.0, 34.0, 25.0, 47.0, 54.0, 62.0, 66.0, 72.0, 94.0, 71.0, 65.0, 70.0, 44.0, 51.0, 38.0, 31.0, 15.0, 17.0, 18.0, 11.0, 9.0, 7.0, 4.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.302927017211914e-05, -8.033681660890579e-05, -7.764436304569244e-05, -7.49519094824791e-05, -7.225945591926575e-05, -6.95670023560524e-05, -6.687454879283905e-05, -6.41820952296257e-05, -6.148964166641235e-05, -5.8797188103199005e-05, -5.610473453998566e-05, -5.341228097677231e-05, -5.071982741355896e-05, -4.802737385034561e-05, -4.533492028713226e-05, -4.2642466723918915e-05, -3.9950013160705566e-05, -3.725755959749222e-05, -3.456510603427887e-05, -3.187265247106552e-05, -2.9180198907852173e-05, -2.6487745344638824e-05, -2.3795291781425476e-05, -2.1102838218212128e-05, -1.841038465499878e-05, -1.571793109178543e-05, -1.3025477528572083e-05, -1.0333023965358734e-05, -7.640570402145386e-06, -4.948116838932037e-06, -2.255663275718689e-06, 4.367902874946594e-07, 3.129243850708008e-06, 5.821697413921356e-06, 8.514150977134705e-06, 1.1206604540348053e-05, 1.3899058103561401e-05, 1.659151166677475e-05, 1.9283965229988098e-05, 2.1976418793201447e-05, 2.4668872356414795e-05, 2.7361325919628143e-05, 3.0053779482841492e-05, 3.274623304605484e-05, 3.543868660926819e-05, 3.813114017248154e-05, 4.0823593735694885e-05, 4.3516047298908234e-05, 4.620850086212158e-05, 4.890095442533493e-05, 5.159340798854828e-05, 5.428586155176163e-05, 5.6978315114974976e-05, 5.9670768678188324e-05, 6.236322224140167e-05, 6.505567580461502e-05, 6.774812936782837e-05, 7.044058293104172e-05, 7.313303649425507e-05, 7.582549005746841e-05, 7.851794362068176e-05, 8.121039718389511e-05, 8.390285074710846e-05, 8.659530431032181e-05, 8.928775787353516e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 25.0, 34.0, 66.0, 154.0, 350.0, 1091.0, 7040.0, 341367.0, 685280.0, 10977.0, 1403.0, 423.0, 144.0, 73.0, 38.0, 29.0, 18.0, 8.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.272979736328125, -1.21783447265625, -1.162689208984375, -1.1075439453125, -1.052398681640625, -0.99725341796875, -0.942108154296875, -0.886962890625, -0.831817626953125, -0.77667236328125, -0.721527099609375, -0.6663818359375, -0.611236572265625, -0.55609130859375, -0.500946044921875, -0.44580078125, -0.390655517578125, -0.33551025390625, -0.280364990234375, -0.2252197265625, -0.170074462890625, -0.11492919921875, -0.059783935546875, -0.004638671875, 0.050506591796875, 0.10565185546875, 0.160797119140625, 0.2159423828125, 0.271087646484375, 0.32623291015625, 0.381378173828125, 0.4365234375, 0.491668701171875, 0.54681396484375, 0.601959228515625, 0.6571044921875, 0.712249755859375, 0.76739501953125, 0.822540283203125, 0.877685546875, 0.932830810546875, 0.98797607421875, 1.043121337890625, 1.0982666015625, 1.153411865234375, 1.20855712890625, 1.263702392578125, 1.31884765625, 1.373992919921875, 1.42913818359375, 1.484283447265625, 1.5394287109375, 1.594573974609375, 1.64971923828125, 1.704864501953125, 1.760009765625, 1.815155029296875, 1.87030029296875, 1.925445556640625, 1.9805908203125, 2.035736083984375, 2.09088134765625, 2.146026611328125, 2.201171875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 12.0, 15.0, 28.0, 30.0, 50.0, 94.0, 116.0, 152.0, 149.0, 127.0, 88.0, 43.0, 33.0, 28.0, 15.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7096939086914062, -0.6679229736328125, -0.6261520385742188, -0.584381103515625, -0.5426101684570312, -0.5008392333984375, -0.45906829833984375, -0.41729736328125, -0.37552642822265625, -0.3337554931640625, -0.29198455810546875, -0.250213623046875, -0.20844268798828125, -0.1666717529296875, -0.12490081787109375, -0.0831298828125, -0.04135894775390625, 0.0004119873046875, 0.04218292236328125, 0.083953857421875, 0.12572479248046875, 0.1674957275390625, 0.20926666259765625, 0.25103759765625, 0.29280853271484375, 0.3345794677734375, 0.37635040283203125, 0.418121337890625, 0.45989227294921875, 0.5016632080078125, 0.5434341430664062, 0.585205078125, 0.6269760131835938, 0.6687469482421875, 0.7105178833007812, 0.752288818359375, 0.7940597534179688, 0.8358306884765625, 0.8776016235351562, 0.91937255859375, 0.9611434936523438, 1.0029144287109375, 1.0446853637695312, 1.086456298828125, 1.1282272338867188, 1.1699981689453125, 1.2117691040039062, 1.2535400390625, 1.2953109741210938, 1.3370819091796875, 1.3788528442382812, 1.420623779296875, 1.4623947143554688, 1.5041656494140625, 1.5459365844726562, 1.58770751953125, 1.6294784545898438, 1.6712493896484375, 1.7130203247070312, 1.754791259765625, 1.7965621948242188, 1.8383331298828125, 1.8801040649414062, 1.921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 8.0, 10.0, 94.0, 414.0, 396.0, 72.0, 15.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.544710159301758, -6.038434982299805, -4.532159328460693, -3.025883674621582, -1.519608497619629, -0.013333320617675781, 1.4929428100585938, 2.999217987060547, 4.5054931640625, 6.011768341064453, 7.5180439949035645, 9.024319648742676, 10.530594825744629, 12.036870002746582, 13.543146133422852, 15.049421310424805, 16.555696487426758, 18.06197166442871, 19.568246841430664, 21.07452392578125, 22.580799102783203, 24.087074279785156, 25.59334945678711, 27.099624633789062, 28.605899810791016, 30.11217498779297, 31.618450164794922, 33.124725341796875, 34.63100051879883, 36.13727569580078, 37.6435546875, 39.14982604980469, 40.656105041503906, 42.16238021850586, 43.66865539550781, 45.174930572509766, 46.68120574951172, 48.18748092651367, 49.693756103515625, 51.200035095214844, 52.70630645751953, 54.212581634521484, 55.71885681152344, 57.22513198852539, 58.731407165527344, 60.2376823425293, 61.74395751953125, 63.25023651123047, 64.75651550292969, 66.2627944946289, 67.7690658569336, 69.27534484863281, 70.7816162109375, 72.28789520263672, 73.7941665649414, 75.30044555664062, 76.80671691894531, 78.31299591064453, 79.81926727294922, 81.32554626464844, 82.83181762695312, 84.33809661865234, 85.84436798095703, 87.35064697265625, 88.85691833496094]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 6.0, 5.0, 8.0, 12.0, 12.0, 20.0, 15.0, 23.0, 16.0, 20.0, 38.0, 28.0, 44.0, 31.0, 48.0, 37.0, 46.0, 52.0, 50.0, 63.0, 50.0, 46.0, 38.0, 47.0, 33.0, 31.0, 28.0, 21.0, 12.0, 23.0, 16.0, 15.0, 12.0, 12.0, 9.0, 7.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.179851531982422, -7.908729076385498, -7.637606143951416, -7.366483688354492, -7.09536075592041, -6.824238300323486, -6.5531158447265625, -6.2819929122924805, -6.010870456695557, -5.739748001098633, -5.468625068664551, -5.197502613067627, -4.926380157470703, -4.655257225036621, -4.384134769439697, -4.113012313842773, -3.8418893814086914, -3.5707666873931885, -3.2996439933776855, -3.0285215377807617, -2.757398843765259, -2.486276149749756, -2.215153694152832, -1.944031000137329, -1.6729083061218262, -1.4017856121063232, -1.1306630373001099, -0.8595404028892517, -0.5884177684783936, -0.3172950744628906, -0.046172499656677246, 0.22495007514953613, 0.49607372283935547, 0.7671963572502136, 1.0383189916610718, 1.3094415664672852, 1.580564260482788, 1.851686954498291, 2.122809410095215, 2.3939321041107178, 2.6650547981262207, 2.9361774921417236, 3.2073001861572266, 3.4784226417541504, 3.7495453357696533, 4.020668029785156, 4.29179048538208, 4.562912940979004, 4.834035873413086, 5.10515832901001, 5.376281261444092, 5.647403717041016, 5.918526649475098, 6.1896491050720215, 6.460771560668945, 6.731894493103027, 7.003016948699951, 7.274139404296875, 7.545262336730957, 7.816384792327881, 8.087507247924805, 8.358630180358887, 8.629753112792969, 8.900875091552734, 9.171998023986816]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 6.0, 9.0, 15.0, 16.0, 28.0, 48.0, 70.0, 108.0, 137.0, 252.0, 458.0, 953.0, 2457.0, 8546.0, 58228.0, 4016910.0, 89962.0, 10814.0, 2899.0, 1081.0, 471.0, 282.0, 180.0, 109.0, 68.0, 43.0, 38.0, 25.0, 19.0, 12.0, 6.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.2734375, -2.2076873779296875, -2.141937255859375, -2.0761871337890625, -2.01043701171875, -1.9446868896484375, -1.878936767578125, -1.8131866455078125, -1.7474365234375, -1.6816864013671875, -1.615936279296875, -1.5501861572265625, -1.48443603515625, -1.4186859130859375, -1.352935791015625, -1.2871856689453125, -1.221435546875, -1.1556854248046875, -1.089935302734375, -1.0241851806640625, -0.95843505859375, -0.8926849365234375, -0.826934814453125, -0.7611846923828125, -0.6954345703125, -0.6296844482421875, -0.563934326171875, -0.4981842041015625, -0.43243408203125, -0.3666839599609375, -0.300933837890625, -0.2351837158203125, -0.16943359375, -0.1036834716796875, -0.037933349609375, 0.0278167724609375, 0.09356689453125, 0.1593170166015625, 0.225067138671875, 0.2908172607421875, 0.3565673828125, 0.4223175048828125, 0.488067626953125, 0.5538177490234375, 0.61956787109375, 0.6853179931640625, 0.751068115234375, 0.8168182373046875, 0.882568359375, 0.9483184814453125, 1.014068603515625, 1.0798187255859375, 1.14556884765625, 1.2113189697265625, 1.277069091796875, 1.3428192138671875, 1.4085693359375, 1.4743194580078125, 1.540069580078125, 1.6058197021484375, 1.67156982421875, 1.7373199462890625, 1.803070068359375, 1.8688201904296875, 1.9345703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 9.0, 5.0, 16.0, 18.0, 21.0, 23.0, 50.0, 65.0, 78.0, 91.0, 98.0, 95.0, 99.0, 69.0, 61.0, 67.0, 45.0, 32.0, 17.0, 11.0, 12.0, 2.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86865234375, -0.8459091186523438, -0.8231658935546875, -0.8004226684570312, -0.777679443359375, -0.7549362182617188, -0.7321929931640625, -0.7094497680664062, -0.68670654296875, -0.6639633178710938, -0.6412200927734375, -0.6184768676757812, -0.595733642578125, -0.5729904174804688, -0.5502471923828125, -0.5275039672851562, -0.5047607421875, -0.48201751708984375, -0.4592742919921875, -0.43653106689453125, -0.413787841796875, -0.39104461669921875, -0.3683013916015625, -0.34555816650390625, -0.32281494140625, -0.30007171630859375, -0.2773284912109375, -0.25458526611328125, -0.231842041015625, -0.20909881591796875, -0.1863555908203125, -0.16361236572265625, -0.140869140625, -0.11812591552734375, -0.0953826904296875, -0.07263946533203125, -0.049896240234375, -0.02715301513671875, -0.0044097900390625, 0.01833343505859375, 0.04107666015625, 0.06381988525390625, 0.0865631103515625, 0.10930633544921875, 0.132049560546875, 0.15479278564453125, 0.1775360107421875, 0.20027923583984375, 0.2230224609375, 0.24576568603515625, 0.2685089111328125, 0.29125213623046875, 0.313995361328125, 0.33673858642578125, 0.3594818115234375, 0.38222503662109375, 0.40496826171875, 0.42771148681640625, 0.4504547119140625, 0.47319793701171875, 0.495941162109375, 0.5186843872070312, 0.5414276123046875, 0.5641708374023438, 0.5869140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 8.0, 9.0, 14.0, 18.0, 32.0, 39.0, 71.0, 111.0, 178.0, 299.0, 498.0, 801.0, 1714.0, 3754.0, 11169.0, 51464.0, 3687395.0, 391648.0, 31221.0, 7870.0, 2814.0, 1329.0, 705.0, 439.0, 239.0, 147.0, 95.0, 65.0, 47.0, 35.0, 23.0, 12.0, 8.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.494140625, -1.4405059814453125, -1.386871337890625, -1.3332366943359375, -1.27960205078125, -1.2259674072265625, -1.172332763671875, -1.1186981201171875, -1.0650634765625, -1.0114288330078125, -0.957794189453125, -0.9041595458984375, -0.85052490234375, -0.7968902587890625, -0.743255615234375, -0.6896209716796875, -0.635986328125, -0.5823516845703125, -0.528717041015625, -0.4750823974609375, -0.42144775390625, -0.3678131103515625, -0.314178466796875, -0.2605438232421875, -0.2069091796875, -0.1532745361328125, -0.099639892578125, -0.0460052490234375, 0.00762939453125, 0.0612640380859375, 0.114898681640625, 0.1685333251953125, 0.22216796875, 0.2758026123046875, 0.329437255859375, 0.3830718994140625, 0.43670654296875, 0.4903411865234375, 0.543975830078125, 0.5976104736328125, 0.6512451171875, 0.7048797607421875, 0.758514404296875, 0.8121490478515625, 0.86578369140625, 0.9194183349609375, 0.973052978515625, 1.0266876220703125, 1.080322265625, 1.1339569091796875, 1.187591552734375, 1.2412261962890625, 1.29486083984375, 1.3484954833984375, 1.402130126953125, 1.4557647705078125, 1.5093994140625, 1.5630340576171875, 1.616668701171875, 1.6703033447265625, 1.72393798828125, 1.7775726318359375, 1.831207275390625, 1.8848419189453125, 1.9384765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 10.0, 6.0, 18.0, 20.0, 31.0, 79.0, 145.0, 662.0, 2697.0, 197.0, 90.0, 48.0, 24.0, 16.0, 11.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97412109375, -0.9471664428710938, -0.9202117919921875, -0.8932571411132812, -0.866302490234375, -0.8393478393554688, -0.8123931884765625, -0.7854385375976562, -0.75848388671875, -0.7315292358398438, -0.7045745849609375, -0.6776199340820312, -0.650665283203125, -0.6237106323242188, -0.5967559814453125, -0.5698013305664062, -0.5428466796875, -0.5158920288085938, -0.4889373779296875, -0.46198272705078125, -0.435028076171875, -0.40807342529296875, -0.3811187744140625, -0.35416412353515625, -0.32720947265625, -0.30025482177734375, -0.2733001708984375, -0.24634552001953125, -0.219390869140625, -0.19243621826171875, -0.1654815673828125, -0.13852691650390625, -0.111572265625, -0.08461761474609375, -0.0576629638671875, -0.03070831298828125, -0.003753662109375, 0.02320098876953125, 0.0501556396484375, 0.07711029052734375, 0.10406494140625, 0.13101959228515625, 0.1579742431640625, 0.18492889404296875, 0.211883544921875, 0.23883819580078125, 0.2657928466796875, 0.29274749755859375, 0.3197021484375, 0.34665679931640625, 0.3736114501953125, 0.40056610107421875, 0.427520751953125, 0.45447540283203125, 0.4814300537109375, 0.5083847045898438, 0.53533935546875, 0.5622940063476562, 0.5892486572265625, 0.6162033081054688, 0.643157958984375, 0.6701126098632812, 0.6970672607421875, 0.7240219116210938, 0.7509765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 9.0, 14.0, 44.0, 54.0, 120.0, 195.0, 200.0, 173.0, 99.0, 49.0, 29.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.250251531600952, -3.105616331100464, -2.9609808921813965, -2.816345691680908, -2.671710252761841, -2.5270750522613525, -2.382439613342285, -2.237804412841797, -2.0931692123413086, -1.9485338926315308, -1.803898572921753, -1.6592633724212646, -1.5146279335021973, -1.369992733001709, -1.2253574132919312, -1.0807220935821533, -0.9360866546630859, -0.7914513349533081, -0.6468160152435303, -0.5021807551383972, -0.3575454354286194, -0.21291011571884155, -0.0682748556137085, 0.07636046409606934, 0.22099578380584717, 0.365631103515625, 0.5102664232254028, 0.6549016833305359, 0.7995370030403137, 0.9441723227500916, 1.0888075828552246, 1.2334429025650024, 1.3780779838562012, 1.522713303565979, 1.6673486232757568, 1.8119838237762451, 1.9566192626953125, 2.101254463195801, 2.245889663696289, 2.3905251026153564, 2.535160541534424, 2.679795742034912, 2.8244311809539795, 2.9690663814544678, 3.113701820373535, 3.2583370208740234, 3.4029722213745117, 3.547607660293579, 3.6922428607940674, 3.8368780612945557, 3.981513500213623, 4.126148700714111, 4.2707839012146, 4.415419578552246, 4.560054779052734, 4.704689979553223, 4.849325180053711, 4.993960380554199, 5.1385955810546875, 5.283231258392334, 5.427866458892822, 5.5725016593933105, 5.717136859893799, 5.861772537231445, 6.006407737731934]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 5.0, 7.0, 11.0, 13.0, 21.0, 17.0, 27.0, 19.0, 18.0, 31.0, 27.0, 41.0, 40.0, 36.0, 45.0, 53.0, 50.0, 40.0, 52.0, 40.0, 33.0, 51.0, 47.0, 41.0, 28.0, 30.0, 29.0, 21.0, 23.0, 22.0, 13.0, 13.0, 11.0, 9.0, 5.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.692967176437378, -1.6411323547363281, -1.5892975330352783, -1.5374627113342285, -1.4856278896331787, -1.433793067932129, -1.381958246231079, -1.3301235437393188, -1.278288722038269, -1.2264539003372192, -1.1746190786361694, -1.1227842569351196, -1.0709494352340698, -1.0191147327423096, -0.967279851436615, -0.91544508934021, -0.8636102080345154, -0.8117753863334656, -0.7599405646324158, -0.7081058025360107, -0.6562709808349609, -0.6044361591339111, -0.5526013374328613, -0.5007665157318115, -0.4489317238330841, -0.3970969021320343, -0.3452621102333069, -0.2934272885322571, -0.24159248173236847, -0.18975767493247986, -0.13792285323143005, -0.08608806133270264, -0.03425323963165283, 0.017581570893526077, 0.06941638141870499, 0.1212511956691742, 0.1730860024690628, 0.22492080926895142, 0.2767556309700012, 0.32859042286872864, 0.38042524456977844, 0.43226006627082825, 0.48409485816955566, 0.5359296798706055, 0.5877645015716553, 0.6395993232727051, 0.6914341449737549, 0.7432689070701599, 0.7951037287712097, 0.8469385504722595, 0.8987733721733093, 0.9506081342697144, 1.0024429559707642, 1.054277777671814, 1.1061125993728638, 1.1579474210739136, 1.2097822427749634, 1.2616170644760132, 1.313451886177063, 1.3652867078781128, 1.4171215295791626, 1.4689562320709229, 1.5207910537719727, 1.5726258754730225, 1.6244606971740723]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 9.0, 15.0, 12.0, 27.0, 51.0, 73.0, 132.0, 270.0, 575.0, 1369.0, 4109.0, 16229.0, 92156.0, 474471.0, 376450.0, 64743.0, 12451.0, 3299.0, 1123.0, 483.0, 212.0, 100.0, 73.0, 37.0, 32.0, 16.0, 11.0, 10.0, 4.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9892578125, -1.9381256103515625, -1.886993408203125, -1.8358612060546875, -1.78472900390625, -1.7335968017578125, -1.682464599609375, -1.6313323974609375, -1.5802001953125, -1.5290679931640625, -1.477935791015625, -1.4268035888671875, -1.37567138671875, -1.3245391845703125, -1.273406982421875, -1.2222747802734375, -1.171142578125, -1.1200103759765625, -1.068878173828125, -1.0177459716796875, -0.96661376953125, -0.9154815673828125, -0.864349365234375, -0.8132171630859375, -0.7620849609375, -0.7109527587890625, -0.659820556640625, -0.6086883544921875, -0.55755615234375, -0.5064239501953125, -0.455291748046875, -0.4041595458984375, -0.35302734375, -0.3018951416015625, -0.250762939453125, -0.1996307373046875, -0.14849853515625, -0.0973663330078125, -0.046234130859375, 0.0048980712890625, 0.0560302734375, 0.1071624755859375, 0.158294677734375, 0.2094268798828125, 0.26055908203125, 0.3116912841796875, 0.362823486328125, 0.4139556884765625, 0.465087890625, 0.5162200927734375, 0.567352294921875, 0.6184844970703125, 0.66961669921875, 0.7207489013671875, 0.771881103515625, 0.8230133056640625, 0.8741455078125, 0.9252777099609375, 0.976409912109375, 1.0275421142578125, 1.07867431640625, 1.1298065185546875, 1.180938720703125, 1.2320709228515625, 1.283203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 8.0, 11.0, 15.0, 19.0, 27.0, 27.0, 51.0, 61.0, 58.0, 83.0, 57.0, 84.0, 83.0, 64.0, 64.0, 64.0, 46.0, 49.0, 27.0, 27.0, 21.0, 9.0, 6.0, 8.0, 5.0, 2.0, 6.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69921875, -0.679656982421875, -0.66009521484375, -0.640533447265625, -0.6209716796875, -0.601409912109375, -0.58184814453125, -0.562286376953125, -0.542724609375, -0.523162841796875, -0.50360107421875, -0.484039306640625, -0.4644775390625, -0.444915771484375, -0.42535400390625, -0.405792236328125, -0.38623046875, -0.366668701171875, -0.34710693359375, -0.327545166015625, -0.3079833984375, -0.288421630859375, -0.26885986328125, -0.249298095703125, -0.229736328125, -0.210174560546875, -0.19061279296875, -0.171051025390625, -0.1514892578125, -0.131927490234375, -0.11236572265625, -0.092803955078125, -0.0732421875, -0.053680419921875, -0.03411865234375, -0.014556884765625, 0.0050048828125, 0.024566650390625, 0.04412841796875, 0.063690185546875, 0.083251953125, 0.102813720703125, 0.12237548828125, 0.141937255859375, 0.1614990234375, 0.181060791015625, 0.20062255859375, 0.220184326171875, 0.23974609375, 0.259307861328125, 0.27886962890625, 0.298431396484375, 0.3179931640625, 0.337554931640625, 0.35711669921875, 0.376678466796875, 0.396240234375, 0.415802001953125, 0.43536376953125, 0.454925537109375, 0.4744873046875, 0.494049072265625, 0.51361083984375, 0.533172607421875, 0.552734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 5.0, 6.0, 3.0, 8.0, 19.0, 19.0, 32.0, 52.0, 62.0, 124.0, 188.0, 295.0, 626.0, 1189.0, 3109.0, 10738.0, 79137.0, 650900.0, 267179.0, 25946.0, 5216.0, 1800.0, 794.0, 420.0, 254.0, 132.0, 101.0, 69.0, 41.0, 27.0, 27.0, 15.0, 4.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.390655517578125, -1.33209228515625, -1.273529052734375, -1.2149658203125, -1.156402587890625, -1.09783935546875, -1.039276123046875, -0.980712890625, -0.922149658203125, -0.86358642578125, -0.805023193359375, -0.7464599609375, -0.687896728515625, -0.62933349609375, -0.570770263671875, -0.51220703125, -0.453643798828125, -0.39508056640625, -0.336517333984375, -0.2779541015625, -0.219390869140625, -0.16082763671875, -0.102264404296875, -0.043701171875, 0.014862060546875, 0.07342529296875, 0.131988525390625, 0.1905517578125, 0.249114990234375, 0.30767822265625, 0.366241455078125, 0.4248046875, 0.483367919921875, 0.54193115234375, 0.600494384765625, 0.6590576171875, 0.717620849609375, 0.77618408203125, 0.834747314453125, 0.893310546875, 0.951873779296875, 1.01043701171875, 1.069000244140625, 1.1275634765625, 1.186126708984375, 1.24468994140625, 1.303253173828125, 1.36181640625, 1.420379638671875, 1.47894287109375, 1.537506103515625, 1.5960693359375, 1.654632568359375, 1.71319580078125, 1.771759033203125, 1.830322265625, 1.888885498046875, 1.94744873046875, 2.006011962890625, 2.0645751953125, 2.123138427734375, 2.18170166015625, 2.240264892578125, 2.298828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 1.0, 7.0, 15.0, 10.0, 17.0, 23.0, 28.0, 35.0, 27.0, 31.0, 34.0, 38.0, 42.0, 47.0, 52.0, 60.0, 42.0, 49.0, 69.0, 51.0, 39.0, 48.0, 41.0, 31.0, 21.0, 26.0, 26.0, 16.0, 13.0, 9.0, 7.0, 11.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8125, -1.7547454833984375, -1.696990966796875, -1.6392364501953125, -1.58148193359375, -1.5237274169921875, -1.465972900390625, -1.4082183837890625, -1.3504638671875, -1.2927093505859375, -1.234954833984375, -1.1772003173828125, -1.11944580078125, -1.0616912841796875, -1.003936767578125, -0.9461822509765625, -0.888427734375, -0.8306732177734375, -0.772918701171875, -0.7151641845703125, -0.65740966796875, -0.5996551513671875, -0.541900634765625, -0.4841461181640625, -0.4263916015625, -0.3686370849609375, -0.310882568359375, -0.2531280517578125, -0.19537353515625, -0.1376190185546875, -0.079864501953125, -0.0221099853515625, 0.03564453125, 0.0933990478515625, 0.151153564453125, 0.2089080810546875, 0.26666259765625, 0.3244171142578125, 0.382171630859375, 0.4399261474609375, 0.4976806640625, 0.5554351806640625, 0.613189697265625, 0.6709442138671875, 0.72869873046875, 0.7864532470703125, 0.844207763671875, 0.9019622802734375, 0.959716796875, 1.0174713134765625, 1.075225830078125, 1.1329803466796875, 1.19073486328125, 1.2484893798828125, 1.306243896484375, 1.3639984130859375, 1.4217529296875, 1.4795074462890625, 1.537261962890625, 1.5950164794921875, 1.65277099609375, 1.7105255126953125, 1.768280029296875, 1.8260345458984375, 1.8837890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 12.0, 9.0, 35.0, 39.0, 62.0, 77.0, 143.0, 299.0, 728.0, 1919.0, 8126.0, 90707.0, 794700.0, 136975.0, 10796.0, 2300.0, 796.0, 357.0, 184.0, 91.0, 49.0, 35.0, 15.0, 19.0, 16.0, 19.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.95361328125, -0.9275360107421875, -0.901458740234375, -0.8753814697265625, -0.84930419921875, -0.8232269287109375, -0.797149658203125, -0.7710723876953125, -0.7449951171875, -0.7189178466796875, -0.692840576171875, -0.6667633056640625, -0.64068603515625, -0.6146087646484375, -0.588531494140625, -0.5624542236328125, -0.536376953125, -0.5102996826171875, -0.484222412109375, -0.4581451416015625, -0.43206787109375, -0.4059906005859375, -0.379913330078125, -0.3538360595703125, -0.3277587890625, -0.3016815185546875, -0.275604248046875, -0.2495269775390625, -0.22344970703125, -0.1973724365234375, -0.171295166015625, -0.1452178955078125, -0.119140625, -0.0930633544921875, -0.066986083984375, -0.0409088134765625, -0.01483154296875, 0.0112457275390625, 0.037322998046875, 0.0634002685546875, 0.0894775390625, 0.1155548095703125, 0.141632080078125, 0.1677093505859375, 0.19378662109375, 0.2198638916015625, 0.245941162109375, 0.2720184326171875, 0.298095703125, 0.3241729736328125, 0.350250244140625, 0.3763275146484375, 0.40240478515625, 0.4284820556640625, 0.454559326171875, 0.4806365966796875, 0.5067138671875, 0.5327911376953125, 0.558868408203125, 0.5849456787109375, 0.61102294921875, 0.6371002197265625, 0.663177490234375, 0.6892547607421875, 0.71533203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 1.0, 5.0, 10.0, 10.0, 16.0, 13.0, 23.0, 34.0, 42.0, 56.0, 64.0, 90.0, 89.0, 83.0, 94.0, 75.0, 68.0, 53.0, 47.0, 40.0, 24.0, 18.0, 15.0, 5.0, 3.0, 5.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.893013000488281e-05, -8.591823279857635e-05, -8.29063355922699e-05, -7.989443838596344e-05, -7.688254117965698e-05, -7.387064397335052e-05, -7.085874676704407e-05, -6.784684956073761e-05, -6.483495235443115e-05, -6.18230551481247e-05, -5.881115794181824e-05, -5.579926073551178e-05, -5.278736352920532e-05, -4.9775466322898865e-05, -4.676356911659241e-05, -4.375167191028595e-05, -4.073977470397949e-05, -3.7727877497673035e-05, -3.471598029136658e-05, -3.170408308506012e-05, -2.8692185878753662e-05, -2.5680288672447205e-05, -2.2668391466140747e-05, -1.965649425983429e-05, -1.6644597053527832e-05, -1.3632699847221375e-05, -1.0620802640914917e-05, -7.6089054346084595e-06, -4.597008228302002e-06, -1.5851110219955444e-06, 1.426786184310913e-06, 4.438683390617371e-06, 7.450580596923828e-06, 1.0462477803230286e-05, 1.3474375009536743e-05, 1.64862722158432e-05, 1.9498169422149658e-05, 2.2510066628456116e-05, 2.5521963834762573e-05, 2.853386104106903e-05, 3.154575824737549e-05, 3.4557655453681946e-05, 3.75695526599884e-05, 4.058144986629486e-05, 4.359334707260132e-05, 4.6605244278907776e-05, 4.9617141485214233e-05, 5.262903869152069e-05, 5.564093589782715e-05, 5.8652833104133606e-05, 6.166473031044006e-05, 6.467662751674652e-05, 6.768852472305298e-05, 7.070042192935944e-05, 7.37123191356659e-05, 7.672421634197235e-05, 7.973611354827881e-05, 8.274801075458527e-05, 8.575990796089172e-05, 8.877180516719818e-05, 9.178370237350464e-05, 9.47955995798111e-05, 9.780749678611755e-05, 0.00010081939399242401, 0.00010383129119873047]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 14.0, 21.0, 21.0, 27.0, 63.0, 128.0, 229.0, 539.0, 1616.0, 6302.0, 74121.0, 838598.0, 115823.0, 8044.0, 1763.0, 669.0, 259.0, 129.0, 71.0, 44.0, 29.0, 14.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8046722412109375, -0.774383544921875, -0.7440948486328125, -0.71380615234375, -0.6835174560546875, -0.653228759765625, -0.6229400634765625, -0.5926513671875, -0.5623626708984375, -0.532073974609375, -0.5017852783203125, -0.47149658203125, -0.4412078857421875, -0.410919189453125, -0.3806304931640625, -0.350341796875, -0.3200531005859375, -0.289764404296875, -0.2594757080078125, -0.22918701171875, -0.1988983154296875, -0.168609619140625, -0.1383209228515625, -0.1080322265625, -0.0777435302734375, -0.047454833984375, -0.0171661376953125, 0.01312255859375, 0.0434112548828125, 0.073699951171875, 0.1039886474609375, 0.13427734375, 0.1645660400390625, 0.194854736328125, 0.2251434326171875, 0.25543212890625, 0.2857208251953125, 0.316009521484375, 0.3462982177734375, 0.3765869140625, 0.4068756103515625, 0.437164306640625, 0.4674530029296875, 0.49774169921875, 0.5280303955078125, 0.558319091796875, 0.5886077880859375, 0.618896484375, 0.6491851806640625, 0.679473876953125, 0.7097625732421875, 0.74005126953125, 0.7703399658203125, 0.800628662109375, 0.8309173583984375, 0.8612060546875, 0.8914947509765625, 0.921783447265625, 0.9520721435546875, 0.98236083984375, 1.0126495361328125, 1.042938232421875, 1.0732269287109375, 1.103515625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 14.0, 16.0, 26.0, 24.0, 36.0, 47.0, 52.0, 58.0, 69.0, 77.0, 84.0, 87.0, 86.0, 66.0, 67.0, 38.0, 32.0, 37.0, 23.0, 15.0, 10.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78466796875, -0.7642059326171875, -0.743743896484375, -0.7232818603515625, -0.70281982421875, -0.6823577880859375, -0.661895751953125, -0.6414337158203125, -0.6209716796875, -0.6005096435546875, -0.580047607421875, -0.5595855712890625, -0.53912353515625, -0.5186614990234375, -0.498199462890625, -0.4777374267578125, -0.457275390625, -0.4368133544921875, -0.416351318359375, -0.3958892822265625, -0.37542724609375, -0.3549652099609375, -0.334503173828125, -0.3140411376953125, -0.2935791015625, -0.2731170654296875, -0.252655029296875, -0.2321929931640625, -0.21173095703125, -0.1912689208984375, -0.170806884765625, -0.1503448486328125, -0.1298828125, -0.1094207763671875, -0.088958740234375, -0.0684967041015625, -0.04803466796875, -0.0275726318359375, -0.007110595703125, 0.0133514404296875, 0.0338134765625, 0.0542755126953125, 0.074737548828125, 0.0951995849609375, 0.11566162109375, 0.1361236572265625, 0.156585693359375, 0.1770477294921875, 0.197509765625, 0.2179718017578125, 0.238433837890625, 0.2588958740234375, 0.27935791015625, 0.2998199462890625, 0.320281982421875, 0.3407440185546875, 0.3612060546875, 0.3816680908203125, 0.402130126953125, 0.4225921630859375, 0.44305419921875, 0.4635162353515625, 0.483978271484375, 0.5044403076171875, 0.52490234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 8.0, 8.0, 15.0, 31.0, 43.0, 87.0, 112.0, 166.0, 153.0, 145.0, 102.0, 60.0, 33.0, 13.0, 11.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-21.54706573486328, -21.114044189453125, -20.6810245513916, -20.248003005981445, -19.81498146057129, -19.381959915161133, -18.94894027709961, -18.515918731689453, -18.082897186279297, -17.64987564086914, -17.216856002807617, -16.78383445739746, -16.350812911987305, -15.917792320251465, -15.484770774841309, -15.051750183105469, -14.618728637695312, -14.185708045959473, -13.752686500549316, -13.319665908813477, -12.88664436340332, -12.45362377166748, -12.020602226257324, -11.587581634521484, -11.154561042785645, -10.721540451049805, -10.288518905639648, -9.855498313903809, -9.422476768493652, -8.989456176757812, -8.556434631347656, -8.123414039611816, -7.690392971038818, -7.25737190246582, -6.824350833892822, -6.391329765319824, -5.958308696746826, -5.525287628173828, -5.092267036437988, -4.659245491027832, -4.226224899291992, -3.793203830718994, -3.360182762145996, -2.927161693572998, -2.494140625, -2.061119794845581, -1.628098726272583, -1.195077657699585, -0.7620563507080078, -0.32903531193733215, 0.1039857268333435, 0.5370067358016968, 0.9700278043746948, 1.4030487537384033, 1.8360698223114014, 2.2690908908843994, 2.7021119594573975, 3.1351330280303955, 3.5681540966033936, 4.0011749267578125, 4.4341959953308105, 4.867217063903809, 5.300238132476807, 5.733259201049805, 6.166280269622803]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 9.0, 18.0, 21.0, 15.0, 16.0, 24.0, 28.0, 38.0, 32.0, 35.0, 26.0, 40.0, 44.0, 46.0, 54.0, 43.0, 53.0, 40.0, 46.0, 34.0, 46.0, 44.0, 24.0, 39.0, 22.0, 25.0, 16.0, 12.0, 16.0, 9.0, 12.0, 9.0, 5.0, 8.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.958752155303955, -6.720723628997803, -6.482695579528809, -6.244667053222656, -6.006638526916504, -5.768610000610352, -5.530581474304199, -5.292553424835205, -5.054524898529053, -4.8164963722229, -4.578468322753906, -4.340439796447754, -4.102411270141602, -3.864382743835449, -3.626354455947876, -3.3883261680603027, -3.1502976417541504, -2.912269115447998, -2.674240827560425, -2.4362125396728516, -2.198184013366699, -1.9601556062698364, -1.7221271991729736, -1.4840987920761108, -1.246070384979248, -1.0080419778823853, -0.7700135707855225, -0.5319851636886597, -0.2939567565917969, -0.05592834949493408, 0.1821000576019287, 0.4201284646987915, 0.6581573486328125, 0.8961857557296753, 1.134214162826538, 1.3722425699234009, 1.6102709770202637, 1.8482993841171265, 2.0863277912139893, 2.3243560791015625, 2.562384605407715, 2.800413131713867, 3.0384414196014404, 3.2764697074890137, 3.514498233795166, 3.7525267601013184, 3.9905550479888916, 4.228583335876465, 4.466611862182617, 4.7046403884887695, 4.942668914794922, 5.180696964263916, 5.418725490570068, 5.656754016876221, 5.894782066345215, 6.132810592651367, 6.3708391189575195, 6.608867645263672, 6.846896171569824, 7.084924221038818, 7.322952747344971, 7.560981273651123, 7.799009323120117, 8.03703784942627, 8.275066375732422]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 14.0, 23.0, 32.0, 45.0, 71.0, 94.0, 174.0, 353.0, 856.0, 2098.0, 5815.0, 19371.0, 91700.0, 1724204.0, 2216325.0, 101744.0, 20630.0, 6255.0, 2293.0, 1011.0, 501.0, 245.0, 129.0, 86.0, 51.0, 35.0, 28.0, 25.0, 8.0, 7.0, 6.0, 10.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.24609375, -1.2115097045898438, -1.1769256591796875, -1.1423416137695312, -1.107757568359375, -1.0731735229492188, -1.0385894775390625, -1.0040054321289062, -0.96942138671875, -0.9348373413085938, -0.9002532958984375, -0.8656692504882812, -0.831085205078125, -0.7965011596679688, -0.7619171142578125, -0.7273330688476562, -0.6927490234375, -0.6581649780273438, -0.6235809326171875, -0.5889968872070312, -0.554412841796875, -0.5198287963867188, -0.4852447509765625, -0.45066070556640625, -0.41607666015625, -0.38149261474609375, -0.3469085693359375, -0.31232452392578125, -0.277740478515625, -0.24315643310546875, -0.2085723876953125, -0.17398834228515625, -0.139404296875, -0.10482025146484375, -0.0702362060546875, -0.03565216064453125, -0.001068115234375, 0.03351593017578125, 0.0680999755859375, 0.10268402099609375, 0.13726806640625, 0.17185211181640625, 0.2064361572265625, 0.24102020263671875, 0.275604248046875, 0.31018829345703125, 0.3447723388671875, 0.37935638427734375, 0.4139404296875, 0.44852447509765625, 0.4831085205078125, 0.5176925659179688, 0.552276611328125, 0.5868606567382812, 0.6214447021484375, 0.6560287475585938, 0.69061279296875, 0.7251968383789062, 0.7597808837890625, 0.7943649291992188, 0.828948974609375, 0.8635330200195312, 0.8981170654296875, 0.9327011108398438, 0.96728515625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 11.0, 8.0, 17.0, 10.0, 9.0, 26.0, 27.0, 27.0, 35.0, 43.0, 46.0, 60.0, 56.0, 61.0, 68.0, 57.0, 66.0, 55.0, 54.0, 33.0, 46.0, 37.0, 31.0, 25.0, 22.0, 15.0, 15.0, 7.0, 6.0, 6.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3655204772949219, -0.35189056396484375, -0.3382606506347656, -0.3246307373046875, -0.3110008239746094, -0.29737091064453125, -0.2837409973144531, -0.270111083984375, -0.2564811706542969, -0.24285125732421875, -0.22922134399414062, -0.2155914306640625, -0.20196151733398438, -0.18833160400390625, -0.17470169067382812, -0.16107177734375, -0.14744186401367188, -0.13381195068359375, -0.12018203735351562, -0.1065521240234375, -0.09292221069335938, -0.07929229736328125, -0.06566238403320312, -0.052032470703125, -0.038402557373046875, -0.02477264404296875, -0.011142730712890625, 0.0024871826171875, 0.016117095947265625, 0.02974700927734375, 0.043376922607421875, 0.0570068359375, 0.07063674926757812, 0.08426666259765625, 0.09789657592773438, 0.1115264892578125, 0.12515640258789062, 0.13878631591796875, 0.15241622924804688, 0.166046142578125, 0.17967605590820312, 0.19330596923828125, 0.20693588256835938, 0.2205657958984375, 0.23419570922851562, 0.24782562255859375, 0.2614555358886719, 0.27508544921875, 0.2887153625488281, 0.30234527587890625, 0.3159751892089844, 0.3296051025390625, 0.3432350158691406, 0.35686492919921875, 0.3704948425292969, 0.384124755859375, 0.3977546691894531, 0.41138458251953125, 0.4250144958496094, 0.4386444091796875, 0.4522743225097656, 0.46590423583984375, 0.4795341491699219, 0.4931640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 20.0, 24.0, 58.0, 119.0, 262.0, 834.0, 3716.0, 33525.0, 3267053.0, 864748.0, 19970.0, 2709.0, 741.0, 272.0, 110.0, 42.0, 17.0, 17.0, 10.0, 11.0, 7.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.009979248046875, -1.93792724609375, -1.865875244140625, -1.7938232421875, -1.721771240234375, -1.64971923828125, -1.577667236328125, -1.505615234375, -1.433563232421875, -1.36151123046875, -1.289459228515625, -1.2174072265625, -1.145355224609375, -1.07330322265625, -1.001251220703125, -0.92919921875, -0.857147216796875, -0.78509521484375, -0.713043212890625, -0.6409912109375, -0.568939208984375, -0.49688720703125, -0.424835205078125, -0.352783203125, -0.280731201171875, -0.20867919921875, -0.136627197265625, -0.0645751953125, 0.007476806640625, 0.07952880859375, 0.151580810546875, 0.2236328125, 0.295684814453125, 0.36773681640625, 0.439788818359375, 0.5118408203125, 0.583892822265625, 0.65594482421875, 0.727996826171875, 0.800048828125, 0.872100830078125, 0.94415283203125, 1.016204833984375, 1.0882568359375, 1.160308837890625, 1.23236083984375, 1.304412841796875, 1.37646484375, 1.448516845703125, 1.52056884765625, 1.592620849609375, 1.6646728515625, 1.736724853515625, 1.80877685546875, 1.880828857421875, 1.952880859375, 2.024932861328125, 2.09698486328125, 2.169036865234375, 2.2410888671875, 2.313140869140625, 2.38519287109375, 2.457244873046875, 2.529296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 13.0, 23.0, 37.0, 84.0, 164.0, 424.0, 1120.0, 1330.0, 481.0, 174.0, 91.0, 50.0, 24.0, 15.0, 13.0, 8.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.3443756103515625, -1.283477783203125, -1.2225799560546875, -1.16168212890625, -1.1007843017578125, -1.039886474609375, -0.9789886474609375, -0.9180908203125, -0.8571929931640625, -0.796295166015625, -0.7353973388671875, -0.67449951171875, -0.6136016845703125, -0.552703857421875, -0.4918060302734375, -0.430908203125, -0.3700103759765625, -0.309112548828125, -0.2482147216796875, -0.18731689453125, -0.1264190673828125, -0.065521240234375, -0.0046234130859375, 0.0562744140625, 0.1171722412109375, 0.178070068359375, 0.2389678955078125, 0.29986572265625, 0.3607635498046875, 0.421661376953125, 0.4825592041015625, 0.54345703125, 0.6043548583984375, 0.665252685546875, 0.7261505126953125, 0.78704833984375, 0.8479461669921875, 0.908843994140625, 0.9697418212890625, 1.0306396484375, 1.0915374755859375, 1.152435302734375, 1.2133331298828125, 1.27423095703125, 1.3351287841796875, 1.396026611328125, 1.4569244384765625, 1.517822265625, 1.5787200927734375, 1.639617919921875, 1.7005157470703125, 1.76141357421875, 1.8223114013671875, 1.883209228515625, 1.9441070556640625, 2.0050048828125, 2.0659027099609375, 2.126800537109375, 2.1876983642578125, 2.24859619140625, 2.3094940185546875, 2.370391845703125, 2.4312896728515625, 2.4921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 17.0, 39.0, 90.0, 195.0, 192.0, 199.0, 131.0, 55.0, 27.0, 13.0, 17.0, 7.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.360735893249512, -8.938557624816895, -8.516378402709961, -8.094200134277344, -7.672021865844727, -7.249843120574951, -6.827664375305176, -6.405486106872559, -5.983307361602783, -5.561128616333008, -5.138950347900391, -4.716771602630615, -4.29459285736084, -3.8724145889282227, -3.4502358436584473, -3.028057336807251, -2.6058788299560547, -2.1837003231048584, -1.7615216970443726, -1.3393430709838867, -0.9171645641326904, -0.49498605728149414, -0.07280731201171875, 0.34937119483947754, 0.7715497016906738, 1.1937282085418701, 1.615906834602356, 2.038085460662842, 2.460263967514038, 2.8824424743652344, 3.3046212196350098, 3.726799726486206, 4.148977279663086, 4.571156024932861, 4.9933342933654785, 5.415513038635254, 5.837691307067871, 6.2598700523376465, 6.682048797607422, 7.104227066040039, 7.5264058113098145, 7.94858455657959, 8.370762825012207, 8.79294204711914, 9.215120315551758, 9.637298583984375, 10.059476852416992, 10.481656074523926, 10.903834342956543, 11.32601261138916, 11.748191833496094, 12.170370101928711, 12.592548370361328, 13.014726638793945, 13.436905860900879, 13.859084129333496, 14.28126335144043, 14.703441619873047, 15.12562084197998, 15.547799110412598, 15.969977378845215, 16.39215660095215, 16.814334869384766, 17.236513137817383, 17.65869140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 4.0, 8.0, 13.0, 27.0, 20.0, 31.0, 24.0, 33.0, 29.0, 33.0, 30.0, 46.0, 37.0, 48.0, 38.0, 50.0, 42.0, 38.0, 31.0, 44.0, 42.0, 41.0, 45.0, 24.0, 35.0, 30.0, 28.0, 18.0, 13.0, 14.0, 15.0, 9.0, 7.0, 8.0, 7.0, 12.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.8065924644470215, -5.6538519859313965, -5.5011115074157715, -5.348371505737305, -5.19563102722168, -5.042890548706055, -4.89015007019043, -4.737409591674805, -4.58466911315918, -4.431928634643555, -4.27918815612793, -4.126448154449463, -3.973707675933838, -3.820967197418213, -3.668226718902588, -3.515486240386963, -3.362746238708496, -3.210005760192871, -3.057265520095825, -2.9045250415802, -2.7517848014831543, -2.5990443229675293, -2.4463038444519043, -2.2935633659362793, -2.1408231258392334, -1.988082766532898, -1.8353424072265625, -1.6826019287109375, -1.529861569404602, -1.3771212100982666, -1.2243807315826416, -1.0716403722763062, -0.9188995361328125, -0.766159176826477, -0.6134187579154968, -0.460678368806839, -0.30793797969818115, -0.1551976203918457, -0.0024572014808654785, 0.15028321743011475, 0.3030235767364502, 0.45576396584510803, 0.6085043549537659, 0.7612447738647461, 0.9139851331710815, 1.066725492477417, 1.219465970993042, 1.3722063302993774, 1.524946689605713, 1.6776870489120483, 1.8304274082183838, 1.9831678867340088, 2.1359081268310547, 2.2886486053466797, 2.4413890838623047, 2.5941295623779297, 2.7468698024749756, 2.8996102809906006, 3.0523505210876465, 3.2050909996032715, 3.3578314781188965, 3.5105717182159424, 3.6633121967315674, 3.8160524368286133, 3.9687929153442383]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 3.0, 2.0, 8.0, 16.0, 18.0, 30.0, 49.0, 68.0, 122.0, 248.0, 578.0, 1361.0, 3380.0, 10370.0, 37686.0, 159048.0, 477311.0, 268950.0, 64244.0, 16483.0, 5107.0, 1922.0, 768.0, 355.0, 180.0, 87.0, 51.0, 36.0, 25.0, 7.0, 14.0, 7.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.2978515625, -1.2643051147460938, -1.2307586669921875, -1.1972122192382812, -1.163665771484375, -1.1301193237304688, -1.0965728759765625, -1.0630264282226562, -1.02947998046875, -0.9959335327148438, -0.9623870849609375, -0.9288406372070312, -0.895294189453125, -0.8617477416992188, -0.8282012939453125, -0.7946548461914062, -0.7611083984375, -0.7275619506835938, -0.6940155029296875, -0.6604690551757812, -0.626922607421875, -0.5933761596679688, -0.5598297119140625, -0.5262832641601562, -0.49273681640625, -0.45919036865234375, -0.4256439208984375, -0.39209747314453125, -0.358551025390625, -0.32500457763671875, -0.2914581298828125, -0.25791168212890625, -0.224365234375, -0.19081878662109375, -0.1572723388671875, -0.12372589111328125, -0.090179443359375, -0.05663299560546875, -0.0230865478515625, 0.01045989990234375, 0.04400634765625, 0.07755279541015625, 0.1110992431640625, 0.14464569091796875, 0.178192138671875, 0.21173858642578125, 0.2452850341796875, 0.27883148193359375, 0.3123779296875, 0.34592437744140625, 0.3794708251953125, 0.41301727294921875, 0.446563720703125, 0.48011016845703125, 0.5136566162109375, 0.5472030639648438, 0.58074951171875, 0.6142959594726562, 0.6478424072265625, 0.6813888549804688, 0.714935302734375, 0.7484817504882812, 0.7820281982421875, 0.8155746459960938, 0.84912109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 3.0, 6.0, 7.0, 6.0, 11.0, 14.0, 15.0, 14.0, 27.0, 27.0, 20.0, 20.0, 42.0, 36.0, 41.0, 52.0, 49.0, 54.0, 48.0, 55.0, 53.0, 41.0, 50.0, 39.0, 24.0, 35.0, 34.0, 31.0, 26.0, 25.0, 23.0, 14.0, 13.0, 12.0, 4.0, 8.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.33349609375, -0.32195281982421875, -0.3104095458984375, -0.29886627197265625, -0.287322998046875, -0.27577972412109375, -0.2642364501953125, -0.25269317626953125, -0.24114990234375, -0.22960662841796875, -0.2180633544921875, -0.20652008056640625, -0.194976806640625, -0.18343353271484375, -0.1718902587890625, -0.16034698486328125, -0.1488037109375, -0.13726043701171875, -0.1257171630859375, -0.11417388916015625, -0.102630615234375, -0.09108734130859375, -0.0795440673828125, -0.06800079345703125, -0.05645751953125, -0.04491424560546875, -0.0333709716796875, -0.02182769775390625, -0.010284423828125, 0.00125885009765625, 0.0128021240234375, 0.02434539794921875, 0.035888671875, 0.04743194580078125, 0.0589752197265625, 0.07051849365234375, 0.082061767578125, 0.09360504150390625, 0.1051483154296875, 0.11669158935546875, 0.12823486328125, 0.13977813720703125, 0.1513214111328125, 0.16286468505859375, 0.174407958984375, 0.18595123291015625, 0.1974945068359375, 0.20903778076171875, 0.2205810546875, 0.23212432861328125, 0.2436676025390625, 0.25521087646484375, 0.266754150390625, 0.27829742431640625, 0.2898406982421875, 0.30138397216796875, 0.31292724609375, 0.32447052001953125, 0.3360137939453125, 0.34755706787109375, 0.359100341796875, 0.37064361572265625, 0.3821868896484375, 0.39373016357421875, 0.4052734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 12.0, 9.0, 23.0, 31.0, 37.0, 61.0, 106.0, 138.0, 237.0, 349.0, 557.0, 870.0, 1783.0, 4456.0, 21167.0, 229345.0, 697755.0, 75811.0, 9566.0, 2887.0, 1325.0, 769.0, 438.0, 264.0, 186.0, 106.0, 78.0, 43.0, 38.0, 32.0, 24.0, 13.0, 14.0, 3.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0], "bins": [-1.8408203125, -1.7951202392578125, -1.749420166015625, -1.7037200927734375, -1.65802001953125, -1.6123199462890625, -1.566619873046875, -1.5209197998046875, -1.4752197265625, -1.4295196533203125, -1.383819580078125, -1.3381195068359375, -1.29241943359375, -1.2467193603515625, -1.201019287109375, -1.1553192138671875, -1.109619140625, -1.0639190673828125, -1.018218994140625, -0.9725189208984375, -0.92681884765625, -0.8811187744140625, -0.835418701171875, -0.7897186279296875, -0.7440185546875, -0.6983184814453125, -0.652618408203125, -0.6069183349609375, -0.56121826171875, -0.5155181884765625, -0.469818115234375, -0.4241180419921875, -0.37841796875, -0.3327178955078125, -0.287017822265625, -0.2413177490234375, -0.19561767578125, -0.1499176025390625, -0.104217529296875, -0.0585174560546875, -0.0128173828125, 0.0328826904296875, 0.078582763671875, 0.1242828369140625, 0.16998291015625, 0.2156829833984375, 0.261383056640625, 0.3070831298828125, 0.352783203125, 0.3984832763671875, 0.444183349609375, 0.4898834228515625, 0.53558349609375, 0.5812835693359375, 0.626983642578125, 0.6726837158203125, 0.7183837890625, 0.7640838623046875, 0.809783935546875, 0.8554840087890625, 0.90118408203125, 0.9468841552734375, 0.992584228515625, 1.0382843017578125, 1.083984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 14.0, 14.0, 9.0, 16.0, 24.0, 25.0, 32.0, 37.0, 38.0, 55.0, 48.0, 41.0, 43.0, 51.0, 52.0, 56.0, 60.0, 48.0, 50.0, 45.0, 36.0, 44.0, 26.0, 24.0, 21.0, 12.0, 15.0, 8.0, 11.0, 5.0, 2.0, 6.0, 4.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.514678955078125, -1.46295166015625, -1.411224365234375, -1.3594970703125, -1.307769775390625, -1.25604248046875, -1.204315185546875, -1.152587890625, -1.100860595703125, -1.04913330078125, -0.997406005859375, -0.9456787109375, -0.893951416015625, -0.84222412109375, -0.790496826171875, -0.73876953125, -0.687042236328125, -0.63531494140625, -0.583587646484375, -0.5318603515625, -0.480133056640625, -0.42840576171875, -0.376678466796875, -0.324951171875, -0.273223876953125, -0.22149658203125, -0.169769287109375, -0.1180419921875, -0.066314697265625, -0.01458740234375, 0.037139892578125, 0.0888671875, 0.140594482421875, 0.19232177734375, 0.244049072265625, 0.2957763671875, 0.347503662109375, 0.39923095703125, 0.450958251953125, 0.502685546875, 0.554412841796875, 0.60614013671875, 0.657867431640625, 0.7095947265625, 0.761322021484375, 0.81304931640625, 0.864776611328125, 0.91650390625, 0.968231201171875, 1.01995849609375, 1.071685791015625, 1.1234130859375, 1.175140380859375, 1.22686767578125, 1.278594970703125, 1.330322265625, 1.382049560546875, 1.43377685546875, 1.485504150390625, 1.5372314453125, 1.588958740234375, 1.64068603515625, 1.692413330078125, 1.744140625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 12.0, 7.0, 13.0, 17.0, 19.0, 25.0, 51.0, 64.0, 121.0, 193.0, 370.0, 824.0, 2243.0, 8800.0, 67347.0, 726345.0, 215849.0, 19929.0, 3870.0, 1248.0, 504.0, 265.0, 137.0, 89.0, 35.0, 44.0, 22.0, 21.0, 20.0, 10.0, 7.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.55517578125, -0.5364990234375, -0.517822265625, -0.4991455078125, -0.48046875, -0.4617919921875, -0.443115234375, -0.4244384765625, -0.40576171875, -0.3870849609375, -0.368408203125, -0.3497314453125, -0.3310546875, -0.3123779296875, -0.293701171875, -0.2750244140625, -0.25634765625, -0.2376708984375, -0.218994140625, -0.2003173828125, -0.181640625, -0.1629638671875, -0.144287109375, -0.1256103515625, -0.10693359375, -0.0882568359375, -0.069580078125, -0.0509033203125, -0.0322265625, -0.0135498046875, 0.005126953125, 0.0238037109375, 0.04248046875, 0.0611572265625, 0.079833984375, 0.0985107421875, 0.1171875, 0.1358642578125, 0.154541015625, 0.1732177734375, 0.19189453125, 0.2105712890625, 0.229248046875, 0.2479248046875, 0.2666015625, 0.2852783203125, 0.303955078125, 0.3226318359375, 0.34130859375, 0.3599853515625, 0.378662109375, 0.3973388671875, 0.416015625, 0.4346923828125, 0.453369140625, 0.4720458984375, 0.49072265625, 0.5093994140625, 0.528076171875, 0.5467529296875, 0.5654296875, 0.5841064453125, 0.602783203125, 0.6214599609375, 0.64013671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 8.0, 9.0, 14.0, 10.0, 12.0, 13.0, 19.0, 29.0, 38.0, 41.0, 69.0, 80.0, 78.0, 118.0, 91.0, 105.0, 48.0, 50.0, 34.0, 21.0, 33.0, 14.0, 17.0, 9.0, 9.0, 7.0, 4.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010442733764648438, -0.00010148249566555023, -9.853765368461609e-05, -9.559281170368195e-05, -9.26479697227478e-05, -8.970312774181366e-05, -8.675828576087952e-05, -8.381344377994537e-05, -8.086860179901123e-05, -7.792375981807709e-05, -7.497891783714294e-05, -7.20340758562088e-05, -6.908923387527466e-05, -6.614439189434052e-05, -6.319954991340637e-05, -6.025470793247223e-05, -5.7309865951538086e-05, -5.436502397060394e-05, -5.14201819896698e-05, -4.847534000873566e-05, -4.5530498027801514e-05, -4.258565604686737e-05, -3.964081406593323e-05, -3.6695972084999084e-05, -3.375113010406494e-05, -3.08062881231308e-05, -2.7861446142196655e-05, -2.4916604161262512e-05, -2.197176218032837e-05, -1.9026920199394226e-05, -1.6082078218460083e-05, -1.313723623752594e-05, -1.0192394256591797e-05, -7.247552275657654e-06, -4.302710294723511e-06, -1.3578683137893677e-06, 1.5869736671447754e-06, 4.5318156480789185e-06, 7.4766576290130615e-06, 1.0421499609947205e-05, 1.3366341590881348e-05, 1.631118357181549e-05, 1.9256025552749634e-05, 2.2200867533683777e-05, 2.514570951461792e-05, 2.8090551495552063e-05, 3.1035393476486206e-05, 3.398023545742035e-05, 3.692507743835449e-05, 3.9869919419288635e-05, 4.281476140022278e-05, 4.575960338115692e-05, 4.8704445362091064e-05, 5.164928734302521e-05, 5.459412932395935e-05, 5.7538971304893494e-05, 6.048381328582764e-05, 6.342865526676178e-05, 6.637349724769592e-05, 6.931833922863007e-05, 7.226318120956421e-05, 7.520802319049835e-05, 7.81528651714325e-05, 8.109770715236664e-05, 8.404254913330078e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 22.0, 32.0, 44.0, 83.0, 127.0, 248.0, 471.0, 1060.0, 3048.0, 14583.0, 194610.0, 767026.0, 56962.0, 6808.0, 1878.0, 740.0, 355.0, 184.0, 83.0, 63.0, 38.0, 23.0, 10.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6619491577148438, -0.6407928466796875, -0.6196365356445312, -0.598480224609375, -0.5773239135742188, -0.5561676025390625, -0.5350112915039062, -0.51385498046875, -0.49269866943359375, -0.4715423583984375, -0.45038604736328125, -0.429229736328125, -0.40807342529296875, -0.3869171142578125, -0.36576080322265625, -0.3446044921875, -0.32344818115234375, -0.3022918701171875, -0.28113555908203125, -0.259979248046875, -0.23882293701171875, -0.2176666259765625, -0.19651031494140625, -0.17535400390625, -0.15419769287109375, -0.1330413818359375, -0.11188507080078125, -0.090728759765625, -0.06957244873046875, -0.0484161376953125, -0.02725982666015625, -0.006103515625, 0.01505279541015625, 0.0362091064453125, 0.05736541748046875, 0.078521728515625, 0.09967803955078125, 0.1208343505859375, 0.14199066162109375, 0.16314697265625, 0.18430328369140625, 0.2054595947265625, 0.22661590576171875, 0.247772216796875, 0.26892852783203125, 0.2900848388671875, 0.31124114990234375, 0.3323974609375, 0.35355377197265625, 0.3747100830078125, 0.39586639404296875, 0.417022705078125, 0.43817901611328125, 0.4593353271484375, 0.48049163818359375, 0.50164794921875, 0.5228042602539062, 0.5439605712890625, 0.5651168823242188, 0.586273193359375, 0.6074295043945312, 0.6285858154296875, 0.6497421264648438, 0.6708984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 3.0, 7.0, 2.0, 1.0, 7.0, 7.0, 11.0, 18.0, 14.0, 17.0, 30.0, 24.0, 35.0, 36.0, 44.0, 47.0, 56.0, 55.0, 73.0, 56.0, 50.0, 54.0, 57.0, 56.0, 38.0, 31.0, 37.0, 26.0, 26.0, 15.0, 12.0, 15.0, 10.0, 9.0, 4.0, 2.0, 5.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.46337890625, -0.4516754150390625, -0.439971923828125, -0.4282684326171875, -0.41656494140625, -0.4048614501953125, -0.393157958984375, -0.3814544677734375, -0.3697509765625, -0.3580474853515625, -0.346343994140625, -0.3346405029296875, -0.32293701171875, -0.3112335205078125, -0.299530029296875, -0.2878265380859375, -0.276123046875, -0.2644195556640625, -0.252716064453125, -0.2410125732421875, -0.22930908203125, -0.2176055908203125, -0.205902099609375, -0.1941986083984375, -0.1824951171875, -0.1707916259765625, -0.159088134765625, -0.1473846435546875, -0.13568115234375, -0.1239776611328125, -0.112274169921875, -0.1005706787109375, -0.0888671875, -0.0771636962890625, -0.065460205078125, -0.0537567138671875, -0.04205322265625, -0.0303497314453125, -0.018646240234375, -0.0069427490234375, 0.0047607421875, 0.0164642333984375, 0.028167724609375, 0.0398712158203125, 0.05157470703125, 0.0632781982421875, 0.074981689453125, 0.0866851806640625, 0.098388671875, 0.1100921630859375, 0.121795654296875, 0.1334991455078125, 0.14520263671875, 0.1569061279296875, 0.168609619140625, 0.1803131103515625, 0.1920166015625, 0.2037200927734375, 0.215423583984375, 0.2271270751953125, 0.23883056640625, 0.2505340576171875, 0.262237548828125, 0.2739410400390625, 0.28564453125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 28.0, 20.0, 52.0, 106.0, 143.0, 178.0, 168.0, 139.0, 89.0, 34.0, 10.0, 13.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.555559158325195, -13.2539644241333, -12.952369689941406, -12.650774955749512, -12.349180221557617, -12.047586441040039, -11.745991706848145, -11.44439697265625, -11.142802238464355, -10.841207504272461, -10.539612770080566, -10.238018035888672, -9.936424255371094, -9.6348295211792, -9.333234786987305, -9.03164005279541, -8.730045318603516, -8.428450584411621, -8.126855850219727, -7.82526159286499, -7.523666858673096, -7.222072124481201, -6.920477867126465, -6.61888313293457, -6.317288398742676, -6.015693664550781, -5.714098930358887, -5.41250467300415, -5.110909938812256, -4.809315204620361, -4.507720947265625, -4.2061262130737305, -3.904531955718994, -3.6029372215270996, -3.301342725753784, -2.9997482299804688, -2.698153495788574, -2.3965587615966797, -2.0949642658233643, -1.7933697700500488, -1.4917750358581543, -1.1901804208755493, -0.8885858058929443, -0.5869911909103394, -0.2853965759277344, 0.016198039054870605, 0.3177926540374756, 0.619387149810791, 0.9209818840026855, 1.2225764989852905, 1.5241711139678955, 1.8257657289505005, 2.1273603439331055, 2.428955078125, 2.7305495738983154, 3.032144069671631, 3.3337388038635254, 3.63533353805542, 3.9369280338287354, 4.238522529602051, 4.540117263793945, 4.84171199798584, 5.143306732177734, 5.444900989532471, 5.746495723724365]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 10.0, 5.0, 5.0, 7.0, 7.0, 17.0, 13.0, 21.0, 19.0, 29.0, 29.0, 36.0, 47.0, 39.0, 60.0, 81.0, 75.0, 83.0, 66.0, 44.0, 56.0, 44.0, 47.0, 44.0, 20.0, 22.0, 11.0, 17.0, 15.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.460855484008789, -9.210884094238281, -8.960912704467773, -8.710941314697266, -8.460969924926758, -8.21099853515625, -7.961026668548584, -7.711055278778076, -7.461083889007568, -7.2111124992370605, -6.961141109466553, -6.711169719696045, -6.461197853088379, -6.211226463317871, -5.961255073547363, -5.7112836837768555, -5.461312294006348, -5.21134090423584, -4.961369514465332, -4.711398124694824, -4.461426734924316, -4.211455345153809, -3.9614834785461426, -3.7115120887756348, -3.461540699005127, -3.211569309234619, -2.9615979194641113, -2.7116262912750244, -2.4616549015045166, -2.211683511734009, -1.9617120027542114, -1.711740493774414, -1.4617695808410645, -1.2117981910705566, -0.9618266820907593, -0.7118552327156067, -0.4618837833404541, -0.2119123935699463, 0.038059115409851074, 0.28803062438964844, 0.5380020141601562, 0.7879734635353088, 1.0379449129104614, 1.2879164218902588, 1.5378878116607666, 1.7878592014312744, 2.0378308296203613, 2.287802219390869, 2.537773609161377, 2.7877449989318848, 3.0377163887023926, 3.2876880168914795, 3.5376594066619873, 3.787630796432495, 4.037602424621582, 4.28757381439209, 4.537545204162598, 4.7875165939331055, 5.037487983703613, 5.287459373474121, 5.537430763244629, 5.787402153015137, 6.037374019622803, 6.2873454093933105, 6.537316799163818]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 7.0, 8.0, 19.0, 23.0, 26.0, 31.0, 42.0, 68.0, 65.0, 108.0, 146.0, 221.0, 474.0, 1182.0, 4962.0, 43933.0, 3606888.0, 514819.0, 16885.0, 2639.0, 736.0, 329.0, 191.0, 124.0, 91.0, 54.0, 53.0, 38.0, 30.0, 13.0, 11.0, 15.0, 7.0, 11.0, 6.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.884765625, -1.832122802734375, -1.77947998046875, -1.726837158203125, -1.6741943359375, -1.621551513671875, -1.56890869140625, -1.516265869140625, -1.463623046875, -1.410980224609375, -1.35833740234375, -1.305694580078125, -1.2530517578125, -1.200408935546875, -1.14776611328125, -1.095123291015625, -1.04248046875, -0.989837646484375, -0.93719482421875, -0.884552001953125, -0.8319091796875, -0.779266357421875, -0.72662353515625, -0.673980712890625, -0.621337890625, -0.568695068359375, -0.51605224609375, -0.463409423828125, -0.4107666015625, -0.358123779296875, -0.30548095703125, -0.252838134765625, -0.2001953125, -0.147552490234375, -0.09490966796875, -0.042266845703125, 0.0103759765625, 0.063018798828125, 0.11566162109375, 0.168304443359375, 0.220947265625, 0.273590087890625, 0.32623291015625, 0.378875732421875, 0.4315185546875, 0.484161376953125, 0.53680419921875, 0.589447021484375, 0.64208984375, 0.694732666015625, 0.74737548828125, 0.800018310546875, 0.8526611328125, 0.905303955078125, 0.95794677734375, 1.010589599609375, 1.063232421875, 1.115875244140625, 1.16851806640625, 1.221160888671875, 1.2738037109375, 1.326446533203125, 1.37908935546875, 1.431732177734375, 1.484375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 8.0, 12.0, 15.0, 17.0, 21.0, 21.0, 42.0, 47.0, 62.0, 80.0, 69.0, 69.0, 84.0, 86.0, 86.0, 62.0, 53.0, 39.0, 46.0, 27.0, 20.0, 10.0, 2.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.4910888671875, -0.472900390625, -0.4547119140625, -0.4365234375, -0.4183349609375, -0.400146484375, -0.3819580078125, -0.36376953125, -0.3455810546875, -0.327392578125, -0.3092041015625, -0.291015625, -0.2728271484375, -0.254638671875, -0.2364501953125, -0.21826171875, -0.2000732421875, -0.181884765625, -0.1636962890625, -0.1455078125, -0.1273193359375, -0.109130859375, -0.0909423828125, -0.07275390625, -0.0545654296875, -0.036376953125, -0.0181884765625, 0.0, 0.0181884765625, 0.036376953125, 0.0545654296875, 0.07275390625, 0.0909423828125, 0.109130859375, 0.1273193359375, 0.1455078125, 0.1636962890625, 0.181884765625, 0.2000732421875, 0.21826171875, 0.2364501953125, 0.254638671875, 0.2728271484375, 0.291015625, 0.3092041015625, 0.327392578125, 0.3455810546875, 0.36376953125, 0.3819580078125, 0.400146484375, 0.4183349609375, 0.4365234375, 0.4547119140625, 0.472900390625, 0.4910888671875, 0.50927734375, 0.5274658203125, 0.545654296875, 0.5638427734375, 0.58203125, 0.6002197265625, 0.618408203125, 0.6365966796875, 0.65478515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 8.0, 13.0, 14.0, 18.0, 24.0, 42.0, 72.0, 108.0, 152.0, 280.0, 571.0, 1101.0, 2353.0, 5288.0, 13897.0, 46963.0, 308845.0, 3205780.0, 512751.0, 64021.0, 18409.0, 7136.0, 3131.0, 1520.0, 781.0, 422.0, 216.0, 127.0, 75.0, 40.0, 39.0, 19.0, 13.0, 11.0, 11.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84375, -0.8193588256835938, -0.7949676513671875, -0.7705764770507812, -0.746185302734375, -0.7217941284179688, -0.6974029541015625, -0.6730117797851562, -0.64862060546875, -0.6242294311523438, -0.5998382568359375, -0.5754470825195312, -0.551055908203125, -0.5266647338867188, -0.5022735595703125, -0.47788238525390625, -0.4534912109375, -0.42910003662109375, -0.4047088623046875, -0.38031768798828125, -0.355926513671875, -0.33153533935546875, -0.3071441650390625, -0.28275299072265625, -0.25836181640625, -0.23397064208984375, -0.2095794677734375, -0.18518829345703125, -0.160797119140625, -0.13640594482421875, -0.1120147705078125, -0.08762359619140625, -0.063232421875, -0.03884124755859375, -0.0144500732421875, 0.00994110107421875, 0.034332275390625, 0.05872344970703125, 0.0831146240234375, 0.10750579833984375, 0.13189697265625, 0.15628814697265625, 0.1806793212890625, 0.20507049560546875, 0.229461669921875, 0.25385284423828125, 0.2782440185546875, 0.30263519287109375, 0.3270263671875, 0.35141754150390625, 0.3758087158203125, 0.40019989013671875, 0.424591064453125, 0.44898223876953125, 0.4733734130859375, 0.49776458740234375, 0.52215576171875, 0.5465469360351562, 0.5709381103515625, 0.5953292846679688, 0.619720458984375, 0.6441116333007812, 0.6685028076171875, 0.6928939819335938, 0.71728515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 2.0, 5.0, 7.0, 14.0, 17.0, 25.0, 43.0, 73.0, 97.0, 176.0, 339.0, 570.0, 860.0, 741.0, 455.0, 226.0, 137.0, 74.0, 48.0, 36.0, 21.0, 16.0, 13.0, 18.0, 9.0, 11.0, 6.0, 1.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8662109375, -0.83892822265625, -0.8116455078125, -0.78436279296875, -0.757080078125, -0.72979736328125, -0.7025146484375, -0.67523193359375, -0.64794921875, -0.62066650390625, -0.5933837890625, -0.56610107421875, -0.538818359375, -0.51153564453125, -0.4842529296875, -0.45697021484375, -0.4296875, -0.40240478515625, -0.3751220703125, -0.34783935546875, -0.320556640625, -0.29327392578125, -0.2659912109375, -0.23870849609375, -0.21142578125, -0.18414306640625, -0.1568603515625, -0.12957763671875, -0.102294921875, -0.07501220703125, -0.0477294921875, -0.02044677734375, 0.0068359375, 0.03411865234375, 0.0614013671875, 0.08868408203125, 0.115966796875, 0.14324951171875, 0.1705322265625, 0.19781494140625, 0.22509765625, 0.25238037109375, 0.2796630859375, 0.30694580078125, 0.334228515625, 0.36151123046875, 0.3887939453125, 0.41607666015625, 0.443359375, 0.47064208984375, 0.4979248046875, 0.52520751953125, 0.552490234375, 0.57977294921875, 0.6070556640625, 0.63433837890625, 0.66162109375, 0.68890380859375, 0.7161865234375, 0.74346923828125, 0.770751953125, 0.79803466796875, 0.8253173828125, 0.85260009765625, 0.8798828125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 34.0, 127.0, 341.0, 311.0, 121.0, 28.0, 12.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.42849349975586, -17.928373336791992, -17.428253173828125, -16.92813491821289, -16.428014755249023, -15.927894592285156, -15.427775382995605, -14.927656173706055, -14.427536010742188, -13.92741584777832, -13.42729663848877, -12.927177429199219, -12.427057266235352, -11.926937103271484, -11.426817893981934, -10.926698684692383, -10.426578521728516, -9.926458358764648, -9.426339149475098, -8.926219940185547, -8.42609977722168, -7.925980091094971, -7.425860404968262, -6.925740718841553, -6.425621032714844, -5.925501346588135, -5.425381660461426, -4.925261974334717, -4.425142288208008, -3.925022602081299, -3.42490291595459, -2.924783229827881, -2.424661636352539, -1.92454195022583, -1.424422264099121, -0.9243025779724121, -0.4241828918457031, 0.07593679428100586, 0.5760564804077148, 1.0761761665344238, 1.5762958526611328, 2.076415538787842, 2.576535224914551, 3.0766549110412598, 3.5767745971679688, 4.076894283294678, 4.577013969421387, 5.077133655548096, 5.577253341674805, 6.077373027801514, 6.577492713928223, 7.077612400054932, 7.577732086181641, 8.077852249145508, 8.577971458435059, 9.07809066772461, 9.578210830688477, 10.078330993652344, 10.578450202941895, 11.078569412231445, 11.578689575195312, 12.07880973815918, 12.57892894744873, 13.079048156738281, 13.579168319702148]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 4.0, 12.0, 17.0, 18.0, 27.0, 40.0, 48.0, 33.0, 43.0, 50.0, 64.0, 50.0, 69.0, 61.0, 72.0, 48.0, 51.0, 47.0, 35.0, 47.0, 31.0, 27.0, 28.0, 16.0, 9.0, 9.0, 7.0, 9.0, 8.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.135585784912109, -5.9689154624938965, -5.802245616912842, -5.635575294494629, -5.468905448913574, -5.302235126495361, -5.135564804077148, -4.968894958496094, -4.802224636077881, -4.635554313659668, -4.468884468078613, -4.3022141456604, -4.135544300079346, -3.968873977661133, -3.802203893661499, -3.6355338096618652, -3.4688637256622314, -3.3021936416625977, -3.135523557662964, -2.96885347366333, -2.802183151245117, -2.6355130672454834, -2.4688429832458496, -2.3021726608276367, -2.135502815246582, -1.9688327312469482, -1.802162528038025, -1.6354924440383911, -1.4688222408294678, -1.302152156829834, -1.1354820728302002, -0.9688118696212769, -0.8021416664123535, -0.635471522808075, -0.4688014090061188, -0.3021312952041626, -0.13546115159988403, 0.03120899200439453, 0.19787907600402832, 0.36454927921295166, 0.5312193632125854, 0.697889506816864, 0.8645596504211426, 1.0312297344207764, 1.1978998184204102, 1.3645700216293335, 1.5312401056289673, 1.6979103088378906, 1.8645803928375244, 2.031250476837158, 2.197920560836792, 2.364590644836426, 2.5312609672546387, 2.6979310512542725, 2.8646011352539062, 3.031271457672119, 3.197941303253174, 3.3646113872528076, 3.5312814712524414, 3.6979517936706543, 3.864621877670288, 4.031291961669922, 4.197961807250977, 4.3646321296691895, 4.531302452087402]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 18.0, 13.0, 23.0, 45.0, 72.0, 132.0, 263.0, 607.0, 1273.0, 3343.0, 9624.0, 33429.0, 137254.0, 458068.0, 303430.0, 72172.0, 18940.0, 5952.0, 2152.0, 892.0, 352.0, 216.0, 100.0, 65.0, 29.0, 20.0, 18.0, 9.0, 11.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9083786010742188, -0.8768157958984375, -0.8452529907226562, -0.813690185546875, -0.7821273803710938, -0.7505645751953125, -0.7190017700195312, -0.68743896484375, -0.6558761596679688, -0.6243133544921875, -0.5927505493164062, -0.561187744140625, -0.5296249389648438, -0.4980621337890625, -0.46649932861328125, -0.4349365234375, -0.40337371826171875, -0.3718109130859375, -0.34024810791015625, -0.308685302734375, -0.27712249755859375, -0.2455596923828125, -0.21399688720703125, -0.18243408203125, -0.15087127685546875, -0.1193084716796875, -0.08774566650390625, -0.056182861328125, -0.02462005615234375, 0.0069427490234375, 0.03850555419921875, 0.070068359375, 0.10163116455078125, 0.1331939697265625, 0.16475677490234375, 0.196319580078125, 0.22788238525390625, 0.2594451904296875, 0.29100799560546875, 0.32257080078125, 0.35413360595703125, 0.3856964111328125, 0.41725921630859375, 0.448822021484375, 0.48038482666015625, 0.5119476318359375, 0.5435104370117188, 0.5750732421875, 0.6066360473632812, 0.6381988525390625, 0.6697616577148438, 0.701324462890625, 0.7328872680664062, 0.7644500732421875, 0.7960128784179688, 0.82757568359375, 0.8591384887695312, 0.8907012939453125, 0.9222640991210938, 0.953826904296875, 0.9853897094726562, 1.0169525146484375, 1.0485153198242188, 1.080078125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 10.0, 8.0, 10.0, 13.0, 30.0, 22.0, 25.0, 30.0, 42.0, 45.0, 65.0, 69.0, 85.0, 83.0, 64.0, 75.0, 57.0, 59.0, 58.0, 42.0, 30.0, 32.0, 17.0, 14.0, 9.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44189453125, -0.42455291748046875, -0.4072113037109375, -0.38986968994140625, -0.372528076171875, -0.35518646240234375, -0.3378448486328125, -0.32050323486328125, -0.30316162109375, -0.28582000732421875, -0.2684783935546875, -0.25113677978515625, -0.233795166015625, -0.21645355224609375, -0.1991119384765625, -0.18177032470703125, -0.1644287109375, -0.14708709716796875, -0.1297454833984375, -0.11240386962890625, -0.095062255859375, -0.07772064208984375, -0.0603790283203125, -0.04303741455078125, -0.02569580078125, -0.00835418701171875, 0.0089874267578125, 0.02632904052734375, 0.043670654296875, 0.06101226806640625, 0.0783538818359375, 0.09569549560546875, 0.113037109375, 0.13037872314453125, 0.1477203369140625, 0.16506195068359375, 0.182403564453125, 0.19974517822265625, 0.2170867919921875, 0.23442840576171875, 0.25177001953125, 0.26911163330078125, 0.2864532470703125, 0.30379486083984375, 0.321136474609375, 0.33847808837890625, 0.3558197021484375, 0.37316131591796875, 0.3905029296875, 0.40784454345703125, 0.4251861572265625, 0.44252777099609375, 0.459869384765625, 0.47721099853515625, 0.4945526123046875, 0.5118942260742188, 0.52923583984375, 0.5465774536132812, 0.5639190673828125, 0.5812606811523438, 0.598602294921875, 0.6159439086914062, 0.6332855224609375, 0.6506271362304688, 0.66796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 4.0, 13.0, 9.0, 17.0, 19.0, 47.0, 75.0, 90.0, 136.0, 228.0, 398.0, 727.0, 1636.0, 4645.0, 24028.0, 234389.0, 687622.0, 78835.0, 10362.0, 2737.0, 1164.0, 528.0, 289.0, 177.0, 124.0, 68.0, 50.0, 38.0, 19.0, 21.0, 16.0, 11.0, 3.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.383026123046875, -1.33734130859375, -1.291656494140625, -1.2459716796875, -1.200286865234375, -1.15460205078125, -1.108917236328125, -1.063232421875, -1.017547607421875, -0.97186279296875, -0.926177978515625, -0.8804931640625, -0.834808349609375, -0.78912353515625, -0.743438720703125, -0.69775390625, -0.652069091796875, -0.60638427734375, -0.560699462890625, -0.5150146484375, -0.469329833984375, -0.42364501953125, -0.377960205078125, -0.332275390625, -0.286590576171875, -0.24090576171875, -0.195220947265625, -0.1495361328125, -0.103851318359375, -0.05816650390625, -0.012481689453125, 0.033203125, 0.078887939453125, 0.12457275390625, 0.170257568359375, 0.2159423828125, 0.261627197265625, 0.30731201171875, 0.352996826171875, 0.398681640625, 0.444366455078125, 0.49005126953125, 0.535736083984375, 0.5814208984375, 0.627105712890625, 0.67279052734375, 0.718475341796875, 0.76416015625, 0.809844970703125, 0.85552978515625, 0.901214599609375, 0.9468994140625, 0.992584228515625, 1.03826904296875, 1.083953857421875, 1.129638671875, 1.175323486328125, 1.22100830078125, 1.266693115234375, 1.3123779296875, 1.358062744140625, 1.40374755859375, 1.449432373046875, 1.4951171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 8.0, 15.0, 19.0, 16.0, 29.0, 32.0, 29.0, 37.0, 35.0, 40.0, 48.0, 57.0, 64.0, 62.0, 64.0, 43.0, 52.0, 58.0, 50.0, 43.0, 35.0, 31.0, 30.0, 22.0, 16.0, 12.0, 14.0, 11.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.542816162109375, -1.48602294921875, -1.429229736328125, -1.3724365234375, -1.315643310546875, -1.25885009765625, -1.202056884765625, -1.145263671875, -1.088470458984375, -1.03167724609375, -0.974884033203125, -0.9180908203125, -0.861297607421875, -0.80450439453125, -0.747711181640625, -0.69091796875, -0.634124755859375, -0.57733154296875, -0.520538330078125, -0.4637451171875, -0.406951904296875, -0.35015869140625, -0.293365478515625, -0.236572265625, -0.179779052734375, -0.12298583984375, -0.066192626953125, -0.0093994140625, 0.047393798828125, 0.10418701171875, 0.160980224609375, 0.2177734375, 0.274566650390625, 0.33135986328125, 0.388153076171875, 0.4449462890625, 0.501739501953125, 0.55853271484375, 0.615325927734375, 0.672119140625, 0.728912353515625, 0.78570556640625, 0.842498779296875, 0.8992919921875, 0.956085205078125, 1.01287841796875, 1.069671630859375, 1.12646484375, 1.183258056640625, 1.24005126953125, 1.296844482421875, 1.3536376953125, 1.410430908203125, 1.46722412109375, 1.524017333984375, 1.580810546875, 1.637603759765625, 1.69439697265625, 1.751190185546875, 1.8079833984375, 1.864776611328125, 1.92156982421875, 1.978363037109375, 2.03515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 4.0, 5.0, 6.0, 6.0, 15.0, 31.0, 64.0, 115.0, 291.0, 936.0, 5584.0, 220089.0, 804829.0, 14237.0, 1586.0, 408.0, 162.0, 75.0, 33.0, 22.0, 16.0, 9.0, 6.0, 8.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0439453125, -1.00933837890625, -0.9747314453125, -0.94012451171875, -0.905517578125, -0.87091064453125, -0.8363037109375, -0.80169677734375, -0.76708984375, -0.73248291015625, -0.6978759765625, -0.66326904296875, -0.628662109375, -0.59405517578125, -0.5594482421875, -0.52484130859375, -0.490234375, -0.45562744140625, -0.4210205078125, -0.38641357421875, -0.351806640625, -0.31719970703125, -0.2825927734375, -0.24798583984375, -0.21337890625, -0.17877197265625, -0.1441650390625, -0.10955810546875, -0.074951171875, -0.04034423828125, -0.0057373046875, 0.02886962890625, 0.0634765625, 0.09808349609375, 0.1326904296875, 0.16729736328125, 0.201904296875, 0.23651123046875, 0.2711181640625, 0.30572509765625, 0.34033203125, 0.37493896484375, 0.4095458984375, 0.44415283203125, 0.478759765625, 0.51336669921875, 0.5479736328125, 0.58258056640625, 0.6171875, 0.65179443359375, 0.6864013671875, 0.72100830078125, 0.755615234375, 0.79022216796875, 0.8248291015625, 0.85943603515625, 0.89404296875, 0.92864990234375, 0.9632568359375, 0.99786376953125, 1.032470703125, 1.06707763671875, 1.1016845703125, 1.13629150390625, 1.1708984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 7.0, 13.0, 18.0, 30.0, 45.0, 64.0, 108.0, 121.0, 139.0, 122.0, 110.0, 78.0, 44.0, 29.0, 26.0, 14.0, 9.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012564659118652344, -0.00012168660759925842, -0.00011772662401199341, -0.0001137666404247284, -0.00010980665683746338, -0.00010584667325019836, -0.00010188668966293335, -9.792670607566833e-05, -9.396672248840332e-05, -9.00067389011383e-05, -8.604675531387329e-05, -8.208677172660828e-05, -7.812678813934326e-05, -7.416680455207825e-05, -7.020682096481323e-05, -6.624683737754822e-05, -6.22868537902832e-05, -5.832687020301819e-05, -5.4366886615753174e-05, -5.040690302848816e-05, -4.6446919441223145e-05, -4.248693585395813e-05, -3.8526952266693115e-05, -3.45669686794281e-05, -3.0606985092163086e-05, -2.664700150489807e-05, -2.2687017917633057e-05, -1.8727034330368042e-05, -1.4767050743103027e-05, -1.0807067155838013e-05, -6.847083568572998e-06, -2.8870999813079834e-06, 1.0728836059570312e-06, 5.032867193222046e-06, 8.99285078048706e-06, 1.2952834367752075e-05, 1.691281795501709e-05, 2.0872801542282104e-05, 2.483278512954712e-05, 2.8792768716812134e-05, 3.275275230407715e-05, 3.671273589134216e-05, 4.067271947860718e-05, 4.463270306587219e-05, 4.859268665313721e-05, 5.255267024040222e-05, 5.6512653827667236e-05, 6.047263741493225e-05, 6.443262100219727e-05, 6.839260458946228e-05, 7.23525881767273e-05, 7.631257176399231e-05, 8.027255535125732e-05, 8.423253893852234e-05, 8.819252252578735e-05, 9.215250611305237e-05, 9.611248970031738e-05, 0.0001000724732875824, 0.00010403245687484741, 0.00010799244046211243, 0.00011195242404937744, 0.00011591240763664246, 0.00011987239122390747, 0.00012383237481117249, 0.0001277923583984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 7.0, 9.0, 9.0, 12.0, 17.0, 29.0, 46.0, 68.0, 101.0, 150.0, 284.0, 596.0, 1228.0, 3278.0, 12226.0, 91897.0, 683452.0, 223140.0, 23736.0, 4915.0, 1719.0, 734.0, 372.0, 210.0, 117.0, 64.0, 50.0, 23.0, 14.0, 15.0, 15.0, 8.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.54486083984375, -0.5286865234375, -0.51251220703125, -0.496337890625, -0.48016357421875, -0.4639892578125, -0.44781494140625, -0.431640625, -0.41546630859375, -0.3992919921875, -0.38311767578125, -0.366943359375, -0.35076904296875, -0.3345947265625, -0.31842041015625, -0.30224609375, -0.28607177734375, -0.2698974609375, -0.25372314453125, -0.237548828125, -0.22137451171875, -0.2052001953125, -0.18902587890625, -0.1728515625, -0.15667724609375, -0.1405029296875, -0.12432861328125, -0.108154296875, -0.09197998046875, -0.0758056640625, -0.05963134765625, -0.04345703125, -0.02728271484375, -0.0111083984375, 0.00506591796875, 0.021240234375, 0.03741455078125, 0.0535888671875, 0.06976318359375, 0.0859375, 0.10211181640625, 0.1182861328125, 0.13446044921875, 0.150634765625, 0.16680908203125, 0.1829833984375, 0.19915771484375, 0.21533203125, 0.23150634765625, 0.2476806640625, 0.26385498046875, 0.280029296875, 0.29620361328125, 0.3123779296875, 0.32855224609375, 0.3447265625, 0.36090087890625, 0.3770751953125, 0.39324951171875, 0.409423828125, 0.42559814453125, 0.4417724609375, 0.45794677734375, 0.47412109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 10.0, 10.0, 24.0, 25.0, 46.0, 40.0, 70.0, 90.0, 94.0, 105.0, 85.0, 91.0, 84.0, 59.0, 45.0, 37.0, 13.0, 21.0, 13.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6488418579101562, -0.6302032470703125, -0.6115646362304688, -0.592926025390625, -0.5742874145507812, -0.5556488037109375, -0.5370101928710938, -0.51837158203125, -0.49973297119140625, -0.4810943603515625, -0.46245574951171875, -0.443817138671875, -0.42517852783203125, -0.4065399169921875, -0.38790130615234375, -0.3692626953125, -0.35062408447265625, -0.3319854736328125, -0.31334686279296875, -0.294708251953125, -0.27606964111328125, -0.2574310302734375, -0.23879241943359375, -0.22015380859375, -0.20151519775390625, -0.1828765869140625, -0.16423797607421875, -0.145599365234375, -0.12696075439453125, -0.1083221435546875, -0.08968353271484375, -0.071044921875, -0.05240631103515625, -0.0337677001953125, -0.01512908935546875, 0.003509521484375, 0.02214813232421875, 0.0407867431640625, 0.05942535400390625, 0.07806396484375, 0.09670257568359375, 0.1153411865234375, 0.13397979736328125, 0.152618408203125, 0.17125701904296875, 0.1898956298828125, 0.20853424072265625, 0.2271728515625, 0.24581146240234375, 0.2644500732421875, 0.28308868408203125, 0.301727294921875, 0.32036590576171875, 0.3390045166015625, 0.35764312744140625, 0.37628173828125, 0.39492034912109375, 0.4135589599609375, 0.43219757080078125, 0.450836181640625, 0.46947479248046875, 0.4881134033203125, 0.5067520141601562, 0.525390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 40.0, 108.0, 223.0, 300.0, 182.0, 79.0, 23.0, 10.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.266334533691406, -18.833110809326172, -18.399887084960938, -17.966663360595703, -17.53343963623047, -17.100215911865234, -16.6669921875, -16.233768463134766, -15.800543785095215, -15.36732006072998, -14.934096336364746, -14.500872611999512, -14.067647933959961, -13.634424209594727, -13.201200485229492, -12.767976760864258, -12.334753036499023, -11.901529312133789, -11.468305587768555, -11.03508186340332, -10.601858139038086, -10.168634414672852, -9.7354097366333, -9.302186012268066, -8.868962287902832, -8.435738563537598, -8.002514839172363, -7.569290637969971, -7.136066913604736, -6.702843189239502, -6.269618988037109, -5.836395263671875, -5.403171539306641, -4.969947814941406, -4.536724090576172, -4.103499889373779, -3.670276165008545, -3.2370524406433105, -2.803828477859497, -2.3706045150756836, -1.9373807907104492, -1.5041569471359253, -1.0709331035614014, -0.6377092599868774, -0.20448541641235352, 0.22873830795288086, 0.6619622707366943, 1.0951862335205078, 1.5284099578857422, 1.9616338014602661, 2.39485764503479, 2.8280816078186035, 3.261305332183838, 3.6945290565490723, 4.127753257751465, 4.560976982116699, 4.994200706481934, 5.427424430847168, 5.860648155212402, 6.293872356414795, 6.727096080780029, 7.160319805145264, 7.593544006347656, 8.02676773071289, 8.459991455078125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 13.0, 22.0, 22.0, 31.0, 45.0, 55.0, 81.0, 76.0, 93.0, 107.0, 98.0, 74.0, 70.0, 53.0, 42.0, 33.0, 17.0, 16.0, 10.0, 16.0, 6.0, 7.0, 2.0, 3.0, 4.0], "bins": [-18.6641902923584, -18.279586791992188, -17.894981384277344, -17.510377883911133, -17.12577247619629, -16.741168975830078, -16.356563568115234, -15.971959114074707, -15.58735466003418, -15.202750205993652, -14.818145751953125, -14.433541297912598, -14.04893684387207, -13.664332389831543, -13.279727935791016, -12.895123481750488, -12.510519027709961, -12.125914573669434, -11.741310119628906, -11.356705665588379, -10.972101211547852, -10.587496757507324, -10.202892303466797, -9.81828784942627, -9.433684349060059, -9.049079895019531, -8.664475440979004, -8.279870986938477, -7.895266532897949, -7.510662078857422, -7.1260576248168945, -6.741453170776367, -6.35684871673584, -5.9722442626953125, -5.587639808654785, -5.203035354614258, -4.8184309005737305, -4.433826446533203, -4.049221992492676, -3.6646177768707275, -3.2800133228302, -2.895408868789673, -2.5108044147491455, -2.1262001991271973, -1.7415956258773804, -1.356991171836853, -0.9723868370056152, -0.5877823829650879, -0.20317792892456055, 0.1814264953136444, 0.5660309195518494, 0.9506353139877319, 1.3352397680282593, 1.7198442220687866, 2.1044485569000244, 2.4890530109405518, 2.873657464981079, 3.2582619190216064, 3.642866373062134, 4.027470588684082, 4.412075042724609, 4.796679496765137, 5.181283950805664, 5.565888404846191, 5.950492858886719]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 6.0, 9.0, 7.0, 9.0, 16.0, 20.0, 18.0, 36.0, 38.0, 67.0, 90.0, 162.0, 283.0, 720.0, 2045.0, 7367.0, 37705.0, 400046.0, 3366171.0, 331779.0, 35427.0, 7881.0, 2441.0, 1028.0, 422.0, 224.0, 104.0, 57.0, 39.0, 14.0, 17.0, 8.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.08984375, -1.0622329711914062, -1.0346221923828125, -1.0070114135742188, -0.979400634765625, -0.9517898559570312, -0.9241790771484375, -0.8965682983398438, -0.86895751953125, -0.8413467407226562, -0.8137359619140625, -0.7861251831054688, -0.758514404296875, -0.7309036254882812, -0.7032928466796875, -0.6756820678710938, -0.6480712890625, -0.6204605102539062, -0.5928497314453125, -0.5652389526367188, -0.537628173828125, -0.5100173950195312, -0.4824066162109375, -0.45479583740234375, -0.42718505859375, -0.39957427978515625, -0.3719635009765625, -0.34435272216796875, -0.316741943359375, -0.28913116455078125, -0.2615203857421875, -0.23390960693359375, -0.206298828125, -0.17868804931640625, -0.1510772705078125, -0.12346649169921875, -0.095855712890625, -0.06824493408203125, -0.0406341552734375, -0.01302337646484375, 0.01458740234375, 0.04219818115234375, 0.0698089599609375, 0.09741973876953125, 0.125030517578125, 0.15264129638671875, 0.1802520751953125, 0.20786285400390625, 0.2354736328125, 0.26308441162109375, 0.2906951904296875, 0.31830596923828125, 0.345916748046875, 0.37352752685546875, 0.4011383056640625, 0.42874908447265625, 0.45635986328125, 0.48397064208984375, 0.5115814208984375, 0.5391921997070312, 0.566802978515625, 0.5944137573242188, 0.6220245361328125, 0.6496353149414062, 0.67724609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 19.0, 22.0, 33.0, 56.0, 94.0, 125.0, 155.0, 131.0, 135.0, 94.0, 64.0, 34.0, 28.0, 7.0, 8.0, 3.0, 3.0], "bins": [-1.650390625, -1.6197929382324219, -1.5891952514648438, -1.5585975646972656, -1.5279998779296875, -1.4974021911621094, -1.4668045043945312, -1.4362068176269531, -1.405609130859375, -1.3750114440917969, -1.3444137573242188, -1.3138160705566406, -1.2832183837890625, -1.2526206970214844, -1.2220230102539062, -1.1914253234863281, -1.16082763671875, -1.1302299499511719, -1.0996322631835938, -1.0690345764160156, -1.0384368896484375, -1.0078392028808594, -0.9772415161132812, -0.9466438293457031, -0.916046142578125, -0.8854484558105469, -0.8548507690429688, -0.8242530822753906, -0.7936553955078125, -0.7630577087402344, -0.7324600219726562, -0.7018623352050781, -0.6712646484375, -0.6406669616699219, -0.6100692749023438, -0.5794715881347656, -0.5488739013671875, -0.5182762145996094, -0.48767852783203125, -0.4570808410644531, -0.426483154296875, -0.3958854675292969, -0.36528778076171875, -0.3346900939941406, -0.3040924072265625, -0.2734947204589844, -0.24289703369140625, -0.21229934692382812, -0.18170166015625, -0.15110397338867188, -0.12050628662109375, -0.08990859985351562, -0.0593109130859375, -0.028713226318359375, 0.00188446044921875, 0.032482147216796875, 0.063079833984375, 0.09367752075195312, 0.12427520751953125, 0.15487289428710938, 0.1854705810546875, 0.21606826782226562, 0.24666595458984375, 0.2772636413574219, 0.307861328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 11.0, 17.0, 33.0, 24.0, 24.0, 36.0, 76.0, 130.0, 185.0, 325.0, 723.0, 1841.0, 5041.0, 16946.0, 77204.0, 1001704.0, 2875080.0, 170930.0, 30809.0, 8128.0, 2672.0, 1074.0, 546.0, 255.0, 147.0, 99.0, 73.0, 47.0, 30.0, 24.0, 8.0, 9.0, 8.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7705078125, -0.7431640625, -0.7158203125, -0.6884765625, -0.6611328125, -0.6337890625, -0.6064453125, -0.5791015625, -0.5517578125, -0.5244140625, -0.4970703125, -0.4697265625, -0.4423828125, -0.4150390625, -0.3876953125, -0.3603515625, -0.3330078125, -0.3056640625, -0.2783203125, -0.2509765625, -0.2236328125, -0.1962890625, -0.1689453125, -0.1416015625, -0.1142578125, -0.0869140625, -0.0595703125, -0.0322265625, -0.0048828125, 0.0224609375, 0.0498046875, 0.0771484375, 0.1044921875, 0.1318359375, 0.1591796875, 0.1865234375, 0.2138671875, 0.2412109375, 0.2685546875, 0.2958984375, 0.3232421875, 0.3505859375, 0.3779296875, 0.4052734375, 0.4326171875, 0.4599609375, 0.4873046875, 0.5146484375, 0.5419921875, 0.5693359375, 0.5966796875, 0.6240234375, 0.6513671875, 0.6787109375, 0.7060546875, 0.7333984375, 0.7607421875, 0.7880859375, 0.8154296875, 0.8427734375, 0.8701171875, 0.8974609375, 0.9248046875, 0.9521484375, 0.9794921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 7.0, 12.0, 14.0, 24.0, 39.0, 46.0, 60.0, 103.0, 199.0, 295.0, 566.0, 780.0, 702.0, 430.0, 236.0, 180.0, 90.0, 84.0, 43.0, 30.0, 30.0, 21.0, 17.0, 10.0, 12.0, 9.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.91796875, -0.8881607055664062, -0.8583526611328125, -0.8285446166992188, -0.798736572265625, -0.7689285278320312, -0.7391204833984375, -0.7093124389648438, -0.67950439453125, -0.6496963500976562, -0.6198883056640625, -0.5900802612304688, -0.560272216796875, -0.5304641723632812, -0.5006561279296875, -0.47084808349609375, -0.4410400390625, -0.41123199462890625, -0.3814239501953125, -0.35161590576171875, -0.321807861328125, -0.29199981689453125, -0.2621917724609375, -0.23238372802734375, -0.20257568359375, -0.17276763916015625, -0.1429595947265625, -0.11315155029296875, -0.083343505859375, -0.05353546142578125, -0.0237274169921875, 0.00608062744140625, 0.035888671875, 0.06569671630859375, 0.0955047607421875, 0.12531280517578125, 0.155120849609375, 0.18492889404296875, 0.2147369384765625, 0.24454498291015625, 0.27435302734375, 0.30416107177734375, 0.3339691162109375, 0.36377716064453125, 0.393585205078125, 0.42339324951171875, 0.4532012939453125, 0.48300933837890625, 0.5128173828125, 0.5426254272460938, 0.5724334716796875, 0.6022415161132812, 0.632049560546875, 0.6618576049804688, 0.6916656494140625, 0.7214736938476562, 0.75128173828125, 0.7810897827148438, 0.8108978271484375, 0.8407058715820312, 0.870513916015625, 0.9003219604492188, 0.9301300048828125, 0.9599380493164062, 0.98974609375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 11.0, 30.0, 60.0, 165.0, 250.0, 208.0, 153.0, 54.0, 33.0, 11.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.791822910308838, -7.416045188903809, -7.040267467498779, -6.66448974609375, -6.2887115478515625, -5.912933826446533, -5.537156105041504, -5.161377906799316, -4.785600662231445, -4.409822940826416, -4.034045219421387, -3.6582672595977783, -3.28248929977417, -2.9067115783691406, -2.5309338569641113, -2.155155897140503, -1.7793779373168945, -1.4036000967025757, -1.0278222560882568, -0.6520445346832275, -0.2762666940689087, 0.09951114654541016, 0.47528886795043945, 0.8510668277740479, 1.2268445491790771, 1.602622389793396, 1.9784002304077148, 2.354177951812744, 2.7299556732177734, 3.105733633041382, 3.481511354446411, 3.8572893142700195, 4.233067512512207, 4.608845233917236, 4.984622955322266, 5.360401153564453, 5.736178874969482, 6.111956596374512, 6.487734317779541, 6.86351203918457, 7.239290237426758, 7.615067958831787, 7.990845680236816, 8.366623878479004, 8.742401123046875, 9.118179321289062, 9.49395751953125, 9.869734764099121, 10.245512008666992, 10.62129020690918, 10.99706745147705, 11.372845649719238, 11.74862289428711, 12.124401092529297, 12.500179290771484, 12.875956535339355, 13.251734733581543, 13.62751293182373, 14.003290176391602, 14.379068374633789, 14.75484561920166, 15.130623817443848, 15.506401062011719, 15.882179260253906, 16.257957458496094]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 9.0, 19.0, 21.0, 47.0, 53.0, 46.0, 71.0, 92.0, 73.0, 98.0, 88.0, 83.0, 77.0, 56.0, 51.0, 29.0, 26.0, 25.0, 9.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.828957557678223, -5.5522847175598145, -5.275611877441406, -4.998939037322998, -4.72226619720459, -4.445592880249023, -4.168920040130615, -3.892247200012207, -3.615574359893799, -3.3389015197753906, -3.0622286796569824, -2.785555601119995, -2.508882761001587, -2.2322099208831787, -1.955536961555481, -1.6788640022277832, -1.402191162109375, -1.1255183219909668, -0.848845362663269, -0.5721724629402161, -0.2954995632171631, -0.018826723098754883, 0.25784623622894287, 0.5345191955566406, 0.8111920356750488, 1.087864875793457, 1.3645378351211548, 1.6412107944488525, 1.9178836345672607, 2.194556474685669, 2.4712295532226562, 2.7479023933410645, 3.024576187133789, 3.3012490272521973, 3.5779218673706055, 3.8545949459075928, 4.131267547607422, 4.407940864562988, 4.6846137046813965, 4.961286544799805, 5.237959384918213, 5.514632225036621, 5.791305065155029, 6.0679779052734375, 6.344651222229004, 6.621323585510254, 6.89799690246582, 7.1746697425842285, 7.451342582702637, 7.728015422821045, 8.004688262939453, 8.28136157989502, 8.55803394317627, 8.834707260131836, 9.111379623413086, 9.388052940368652, 9.664726257324219, 9.941399574279785, 10.218071937561035, 10.494745254516602, 10.771417617797852, 11.048090934753418, 11.324763298034668, 11.601436614990234, 11.878108978271484]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 10.0, 14.0, 15.0, 34.0, 50.0, 60.0, 113.0, 262.0, 511.0, 1236.0, 3310.0, 10908.0, 43911.0, 185602.0, 460690.0, 256569.0, 62853.0, 15083.0, 4465.0, 1485.0, 644.0, 283.0, 158.0, 98.0, 64.0, 38.0, 23.0, 17.0, 9.0, 7.0, 4.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9814453125, -0.9538955688476562, -0.9263458251953125, -0.8987960815429688, -0.871246337890625, -0.8436965942382812, -0.8161468505859375, -0.7885971069335938, -0.76104736328125, -0.7334976196289062, -0.7059478759765625, -0.6783981323242188, -0.650848388671875, -0.6232986450195312, -0.5957489013671875, -0.5681991577148438, -0.5406494140625, -0.5130996704101562, -0.4855499267578125, -0.45800018310546875, -0.430450439453125, -0.40290069580078125, -0.3753509521484375, -0.34780120849609375, -0.32025146484375, -0.29270172119140625, -0.2651519775390625, -0.23760223388671875, -0.210052490234375, -0.18250274658203125, -0.1549530029296875, -0.12740325927734375, -0.099853515625, -0.07230377197265625, -0.0447540283203125, -0.01720428466796875, 0.010345458984375, 0.03789520263671875, 0.0654449462890625, 0.09299468994140625, 0.12054443359375, 0.14809417724609375, 0.1756439208984375, 0.20319366455078125, 0.230743408203125, 0.25829315185546875, 0.2858428955078125, 0.31339263916015625, 0.3409423828125, 0.36849212646484375, 0.3960418701171875, 0.42359161376953125, 0.451141357421875, 0.47869110107421875, 0.5062408447265625, 0.5337905883789062, 0.56134033203125, 0.5888900756835938, 0.6164398193359375, 0.6439895629882812, 0.671539306640625, 0.6990890502929688, 0.7266387939453125, 0.7541885375976562, 0.78173828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 14.0, 11.0, 19.0, 16.0, 23.0, 21.0, 32.0, 31.0, 45.0, 39.0, 55.0, 60.0, 56.0, 76.0, 50.0, 66.0, 57.0, 62.0, 47.0, 39.0, 29.0, 37.0, 23.0, 19.0, 19.0, 17.0, 15.0, 3.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.52392578125, -0.5107879638671875, -0.497650146484375, -0.4845123291015625, -0.47137451171875, -0.4582366943359375, -0.445098876953125, -0.4319610595703125, -0.4188232421875, -0.4056854248046875, -0.392547607421875, -0.3794097900390625, -0.36627197265625, -0.3531341552734375, -0.339996337890625, -0.3268585205078125, -0.313720703125, -0.3005828857421875, -0.287445068359375, -0.2743072509765625, -0.26116943359375, -0.2480316162109375, -0.234893798828125, -0.2217559814453125, -0.2086181640625, -0.1954803466796875, -0.182342529296875, -0.1692047119140625, -0.15606689453125, -0.1429290771484375, -0.129791259765625, -0.1166534423828125, -0.103515625, -0.0903778076171875, -0.077239990234375, -0.0641021728515625, -0.05096435546875, -0.0378265380859375, -0.024688720703125, -0.0115509033203125, 0.0015869140625, 0.0147247314453125, 0.027862548828125, 0.0410003662109375, 0.05413818359375, 0.0672760009765625, 0.080413818359375, 0.0935516357421875, 0.106689453125, 0.1198272705078125, 0.132965087890625, 0.1461029052734375, 0.15924072265625, 0.1723785400390625, 0.185516357421875, 0.1986541748046875, 0.2117919921875, 0.2249298095703125, 0.238067626953125, 0.2512054443359375, 0.26434326171875, 0.2774810791015625, 0.290618896484375, 0.3037567138671875, 0.31689453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 13.0, 17.0, 27.0, 20.0, 46.0, 41.0, 80.0, 100.0, 142.0, 169.0, 275.0, 359.0, 518.0, 813.0, 1315.0, 2586.0, 7046.0, 37800.0, 332249.0, 589506.0, 58574.0, 9443.0, 3062.0, 1432.0, 921.0, 555.0, 383.0, 249.0, 221.0, 164.0, 101.0, 84.0, 61.0, 47.0, 37.0, 20.0, 15.0, 15.0, 9.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.2529296875, -1.2172393798828125, -1.181549072265625, -1.1458587646484375, -1.11016845703125, -1.0744781494140625, -1.038787841796875, -1.0030975341796875, -0.9674072265625, -0.9317169189453125, -0.896026611328125, -0.8603363037109375, -0.82464599609375, -0.7889556884765625, -0.753265380859375, -0.7175750732421875, -0.681884765625, -0.6461944580078125, -0.610504150390625, -0.5748138427734375, -0.53912353515625, -0.5034332275390625, -0.467742919921875, -0.4320526123046875, -0.3963623046875, -0.3606719970703125, -0.324981689453125, -0.2892913818359375, -0.25360107421875, -0.2179107666015625, -0.182220458984375, -0.1465301513671875, -0.11083984375, -0.0751495361328125, -0.039459228515625, -0.0037689208984375, 0.03192138671875, 0.0676116943359375, 0.103302001953125, 0.1389923095703125, 0.1746826171875, 0.2103729248046875, 0.246063232421875, 0.2817535400390625, 0.31744384765625, 0.3531341552734375, 0.388824462890625, 0.4245147705078125, 0.460205078125, 0.4958953857421875, 0.531585693359375, 0.5672760009765625, 0.60296630859375, 0.6386566162109375, 0.674346923828125, 0.7100372314453125, 0.7457275390625, 0.7814178466796875, 0.817108154296875, 0.8527984619140625, 0.88848876953125, 0.9241790771484375, 0.959869384765625, 0.9955596923828125, 1.03125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 16.0, 9.0, 16.0, 11.0, 24.0, 29.0, 34.0, 36.0, 35.0, 44.0, 58.0, 46.0, 43.0, 47.0, 71.0, 41.0, 39.0, 48.0, 44.0, 45.0, 38.0, 27.0, 29.0, 30.0, 16.0, 16.0, 19.0, 12.0, 17.0, 9.0, 11.0, 12.0, 5.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.705078125, -1.6544189453125, -1.603759765625, -1.5531005859375, -1.50244140625, -1.4517822265625, -1.401123046875, -1.3504638671875, -1.2998046875, -1.2491455078125, -1.198486328125, -1.1478271484375, -1.09716796875, -1.0465087890625, -0.995849609375, -0.9451904296875, -0.89453125, -0.8438720703125, -0.793212890625, -0.7425537109375, -0.69189453125, -0.6412353515625, -0.590576171875, -0.5399169921875, -0.4892578125, -0.4385986328125, -0.387939453125, -0.3372802734375, -0.28662109375, -0.2359619140625, -0.185302734375, -0.1346435546875, -0.083984375, -0.0333251953125, 0.017333984375, 0.0679931640625, 0.11865234375, 0.1693115234375, 0.219970703125, 0.2706298828125, 0.3212890625, 0.3719482421875, 0.422607421875, 0.4732666015625, 0.52392578125, 0.5745849609375, 0.625244140625, 0.6759033203125, 0.7265625, 0.7772216796875, 0.827880859375, 0.8785400390625, 0.92919921875, 0.9798583984375, 1.030517578125, 1.0811767578125, 1.1318359375, 1.1824951171875, 1.233154296875, 1.2838134765625, 1.33447265625, 1.3851318359375, 1.435791015625, 1.4864501953125, 1.537109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 14.0, 13.0, 28.0, 31.0, 72.0, 135.0, 250.0, 651.0, 2031.0, 10794.0, 145599.0, 827217.0, 53713.0, 5759.0, 1334.0, 450.0, 186.0, 89.0, 84.0, 34.0, 22.0, 18.0, 7.0, 9.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4544677734375, -0.435791015625, -0.4171142578125, -0.3984375, -0.3797607421875, -0.361083984375, -0.3424072265625, -0.32373046875, -0.3050537109375, -0.286376953125, -0.2677001953125, -0.2490234375, -0.2303466796875, -0.211669921875, -0.1929931640625, -0.17431640625, -0.1556396484375, -0.136962890625, -0.1182861328125, -0.099609375, -0.0809326171875, -0.062255859375, -0.0435791015625, -0.02490234375, -0.0062255859375, 0.012451171875, 0.0311279296875, 0.0498046875, 0.0684814453125, 0.087158203125, 0.1058349609375, 0.12451171875, 0.1431884765625, 0.161865234375, 0.1805419921875, 0.19921875, 0.2178955078125, 0.236572265625, 0.2552490234375, 0.27392578125, 0.2926025390625, 0.311279296875, 0.3299560546875, 0.3486328125, 0.3673095703125, 0.385986328125, 0.4046630859375, 0.42333984375, 0.4420166015625, 0.460693359375, 0.4793701171875, 0.498046875, 0.5167236328125, 0.535400390625, 0.5540771484375, 0.57275390625, 0.5914306640625, 0.610107421875, 0.6287841796875, 0.6474609375, 0.6661376953125, 0.684814453125, 0.7034912109375, 0.72216796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 5.0, 10.0, 1.0, 6.0, 10.0, 15.0, 15.0, 19.0, 38.0, 43.0, 46.0, 63.0, 61.0, 76.0, 79.0, 92.0, 94.0, 57.0, 44.0, 47.0, 34.0, 26.0, 18.0, 15.0, 18.0, 19.0, 9.0, 4.0, 8.0, 2.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.867813110351562e-05, -7.628742605447769e-05, -7.389672100543976e-05, -7.150601595640182e-05, -6.911531090736389e-05, -6.672460585832596e-05, -6.433390080928802e-05, -6.194319576025009e-05, -5.955249071121216e-05, -5.7161785662174225e-05, -5.477108061313629e-05, -5.238037556409836e-05, -4.9989670515060425e-05, -4.759896546602249e-05, -4.520826041698456e-05, -4.2817555367946625e-05, -4.042685031890869e-05, -3.803614526987076e-05, -3.5645440220832825e-05, -3.325473517179489e-05, -3.086403012275696e-05, -2.8473325073719025e-05, -2.608262002468109e-05, -2.3691914975643158e-05, -2.1301209926605225e-05, -1.891050487756729e-05, -1.6519799828529358e-05, -1.4129094779491425e-05, -1.1738389730453491e-05, -9.347684681415558e-06, -6.9569796323776245e-06, -4.566274583339691e-06, -2.175569534301758e-06, 2.1513551473617554e-07, 2.605840563774109e-06, 4.996545612812042e-06, 7.387250661849976e-06, 9.777955710887909e-06, 1.2168660759925842e-05, 1.4559365808963776e-05, 1.695007085800171e-05, 1.9340775907039642e-05, 2.1731480956077576e-05, 2.412218600511551e-05, 2.6512891054153442e-05, 2.8903596103191376e-05, 3.129430115222931e-05, 3.368500620126724e-05, 3.6075711250305176e-05, 3.846641629934311e-05, 4.085712134838104e-05, 4.3247826397418976e-05, 4.563853144645691e-05, 4.802923649549484e-05, 5.0419941544532776e-05, 5.281064659357071e-05, 5.520135164260864e-05, 5.7592056691646576e-05, 5.998276174068451e-05, 6.237346678972244e-05, 6.476417183876038e-05, 6.715487688779831e-05, 6.954558193683624e-05, 7.193628698587418e-05, 7.432699203491211e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 13.0, 11.0, 15.0, 30.0, 36.0, 58.0, 83.0, 165.0, 254.0, 491.0, 1054.0, 2689.0, 8412.0, 40940.0, 502482.0, 438362.0, 40301.0, 8251.0, 2626.0, 1007.0, 551.0, 260.0, 165.0, 101.0, 60.0, 44.0, 28.0, 21.0, 18.0, 8.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47021484375, -0.45638275146484375, -0.4425506591796875, -0.42871856689453125, -0.414886474609375, -0.40105438232421875, -0.3872222900390625, -0.37339019775390625, -0.35955810546875, -0.34572601318359375, -0.3318939208984375, -0.31806182861328125, -0.304229736328125, -0.29039764404296875, -0.2765655517578125, -0.26273345947265625, -0.2489013671875, -0.23506927490234375, -0.2212371826171875, -0.20740509033203125, -0.193572998046875, -0.17974090576171875, -0.1659088134765625, -0.15207672119140625, -0.13824462890625, -0.12441253662109375, -0.1105804443359375, -0.09674835205078125, -0.082916259765625, -0.06908416748046875, -0.0552520751953125, -0.04141998291015625, -0.027587890625, -0.01375579833984375, 7.62939453125e-05, 0.01390838623046875, 0.027740478515625, 0.04157257080078125, 0.0554046630859375, 0.06923675537109375, 0.08306884765625, 0.09690093994140625, 0.1107330322265625, 0.12456512451171875, 0.138397216796875, 0.15222930908203125, 0.1660614013671875, 0.17989349365234375, 0.1937255859375, 0.20755767822265625, 0.2213897705078125, 0.23522186279296875, 0.249053955078125, 0.26288604736328125, 0.2767181396484375, 0.29055023193359375, 0.30438232421875, 0.31821441650390625, 0.3320465087890625, 0.34587860107421875, 0.359710693359375, 0.37354278564453125, 0.3873748779296875, 0.40120697021484375, 0.4150390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 7.0, 3.0, 5.0, 14.0, 15.0, 12.0, 12.0, 17.0, 23.0, 31.0, 31.0, 37.0, 35.0, 40.0, 32.0, 47.0, 62.0, 72.0, 69.0, 53.0, 59.0, 48.0, 34.0, 49.0, 22.0, 27.0, 29.0, 25.0, 20.0, 8.0, 10.0, 8.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.28466796875, -0.27577972412109375, -0.2668914794921875, -0.25800323486328125, -0.249114990234375, -0.24022674560546875, -0.2313385009765625, -0.22245025634765625, -0.21356201171875, -0.20467376708984375, -0.1957855224609375, -0.18689727783203125, -0.178009033203125, -0.16912078857421875, -0.1602325439453125, -0.15134429931640625, -0.1424560546875, -0.13356781005859375, -0.1246795654296875, -0.11579132080078125, -0.106903076171875, -0.09801483154296875, -0.0891265869140625, -0.08023834228515625, -0.07135009765625, -0.06246185302734375, -0.0535736083984375, -0.04468536376953125, -0.035797119140625, -0.02690887451171875, -0.0180206298828125, -0.00913238525390625, -0.000244140625, 0.00864410400390625, 0.0175323486328125, 0.02642059326171875, 0.035308837890625, 0.04419708251953125, 0.0530853271484375, 0.06197357177734375, 0.07086181640625, 0.07975006103515625, 0.0886383056640625, 0.09752655029296875, 0.106414794921875, 0.11530303955078125, 0.1241912841796875, 0.13307952880859375, 0.1419677734375, 0.15085601806640625, 0.1597442626953125, 0.16863250732421875, 0.177520751953125, 0.18640899658203125, 0.1952972412109375, 0.20418548583984375, 0.21307373046875, 0.22196197509765625, 0.2308502197265625, 0.23973846435546875, 0.248626708984375, 0.25751495361328125, 0.2664031982421875, 0.27529144287109375, 0.2841796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 8.0, 6.0, 11.0, 49.0, 122.0, 293.0, 299.0, 131.0, 47.0, 18.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.055168151855469, -11.624258041381836, -11.193347930908203, -10.76243782043457, -10.331526756286621, -9.900616645812988, -9.469706535339355, -9.038796424865723, -8.60788631439209, -8.176976203918457, -7.746065616607666, -7.315155506134033, -6.8842453956604, -6.453334808349609, -6.022424697875977, -5.591514587402344, -5.160604000091553, -4.72969388961792, -4.298783302307129, -3.867873191833496, -3.4369630813598633, -3.0060527324676514, -2.5751423835754395, -2.1442322731018066, -1.7133219242095947, -1.2824116945266724, -0.8515014052391052, -0.4205911159515381, 0.010319113731384277, 0.44122934341430664, 0.8721396923065186, 1.3030498027801514, 1.7339601516723633, 2.164870500564575, 2.595780611038208, 3.02669095993042, 3.4576010704040527, 3.8885114192962646, 4.319421768188477, 4.750331878662109, 5.181241989135742, 5.612152099609375, 6.043062686920166, 6.473972797393799, 6.904882907867432, 7.335793495178223, 7.7667036056518555, 8.197613716125488, 8.628524780273438, 9.05943489074707, 9.490345001220703, 9.921255111694336, 10.352166175842285, 10.783076286315918, 11.21398639678955, 11.644896507263184, 12.075806617736816, 12.50671672821045, 12.937626838684082, 13.368537902832031, 13.799448013305664, 14.230358123779297, 14.66126823425293, 15.092178344726562, 15.523088455200195]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 6.0, 11.0, 9.0, 11.0, 11.0, 21.0, 29.0, 30.0, 35.0, 36.0, 50.0, 52.0, 68.0, 88.0, 97.0, 78.0, 53.0, 57.0, 43.0, 39.0, 33.0, 35.0, 28.0, 20.0, 14.0, 18.0, 7.0, 6.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.397326469421387, -6.133326053619385, -5.869325637817383, -5.605325222015381, -5.341324806213379, -5.077323913574219, -4.813323497772217, -4.549323081970215, -4.285322666168213, -4.021322250366211, -3.757321834564209, -3.493321180343628, -3.229320764541626, -2.965320348739624, -2.701319694519043, -2.437319278717041, -2.173318862915039, -1.909318447113037, -1.6453179121017456, -1.381317377090454, -1.1173169612884521, -0.8533165454864502, -0.5893160104751587, -0.3253154754638672, -0.061315059661865234, 0.2026854157447815, 0.4666858911514282, 0.730686366558075, 0.9946868419647217, 1.2586872577667236, 1.5226877927780151, 1.7866883277893066, 2.0506887435913086, 2.3146891593933105, 2.5786895751953125, 2.8426902294158936, 3.1066906452178955, 3.3706910610198975, 3.6346917152404785, 3.8986921310424805, 4.162692546844482, 4.426692962646484, 4.690693378448486, 4.954693794250488, 5.218694686889648, 5.482694625854492, 5.746695518493652, 6.010695934295654, 6.274696350097656, 6.538696765899658, 6.80269718170166, 7.066697597503662, 7.330698013305664, 7.594698905944824, 7.858699321746826, 8.122699737548828, 8.386699676513672, 8.650700569152832, 8.914700508117676, 9.178701400756836, 9.44270133972168, 9.70670223236084, 9.970702171325684, 10.234703063964844, 10.498703956604004]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 11.0, 6.0, 8.0, 13.0, 10.0, 17.0, 32.0, 53.0, 57.0, 111.0, 238.0, 573.0, 1710.0, 6501.0, 34786.0, 409029.0, 3316914.0, 381750.0, 33058.0, 6379.0, 1670.0, 650.0, 308.0, 151.0, 81.0, 55.0, 41.0, 19.0, 19.0, 12.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9287109375, -0.90325927734375, -0.8778076171875, -0.85235595703125, -0.826904296875, -0.80145263671875, -0.7760009765625, -0.75054931640625, -0.72509765625, -0.69964599609375, -0.6741943359375, -0.64874267578125, -0.623291015625, -0.59783935546875, -0.5723876953125, -0.54693603515625, -0.521484375, -0.49603271484375, -0.4705810546875, -0.44512939453125, -0.419677734375, -0.39422607421875, -0.3687744140625, -0.34332275390625, -0.31787109375, -0.29241943359375, -0.2669677734375, -0.24151611328125, -0.216064453125, -0.19061279296875, -0.1651611328125, -0.13970947265625, -0.1142578125, -0.08880615234375, -0.0633544921875, -0.03790283203125, -0.012451171875, 0.01300048828125, 0.0384521484375, 0.06390380859375, 0.08935546875, 0.11480712890625, 0.1402587890625, 0.16571044921875, 0.191162109375, 0.21661376953125, 0.2420654296875, 0.26751708984375, 0.29296875, 0.31842041015625, 0.3438720703125, 0.36932373046875, 0.394775390625, 0.42022705078125, 0.4456787109375, 0.47113037109375, 0.49658203125, 0.52203369140625, 0.5474853515625, 0.57293701171875, 0.598388671875, 0.62384033203125, 0.6492919921875, 0.67474365234375, 0.7001953125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 8.0, 14.0, 11.0, 25.0, 19.0, 47.0, 47.0, 59.0, 72.0, 73.0, 108.0, 76.0, 79.0, 90.0, 56.0, 49.0, 40.0, 43.0, 34.0, 15.0, 11.0, 10.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3408203125, -0.32404327392578125, -0.3072662353515625, -0.29048919677734375, -0.273712158203125, -0.25693511962890625, -0.2401580810546875, -0.22338104248046875, -0.20660400390625, -0.18982696533203125, -0.1730499267578125, -0.15627288818359375, -0.139495849609375, -0.12271881103515625, -0.1059417724609375, -0.08916473388671875, -0.0723876953125, -0.05561065673828125, -0.0388336181640625, -0.02205657958984375, -0.005279541015625, 0.01149749755859375, 0.0282745361328125, 0.04505157470703125, 0.06182861328125, 0.07860565185546875, 0.0953826904296875, 0.11215972900390625, 0.128936767578125, 0.14571380615234375, 0.1624908447265625, 0.17926788330078125, 0.196044921875, 0.21282196044921875, 0.2295989990234375, 0.24637603759765625, 0.263153076171875, 0.27993011474609375, 0.2967071533203125, 0.31348419189453125, 0.33026123046875, 0.34703826904296875, 0.3638153076171875, 0.38059234619140625, 0.397369384765625, 0.41414642333984375, 0.4309234619140625, 0.44770050048828125, 0.4644775390625, 0.48125457763671875, 0.4980316162109375, 0.5148086547851562, 0.531585693359375, 0.5483627319335938, 0.5651397705078125, 0.5819168090820312, 0.59869384765625, 0.6154708862304688, 0.6322479248046875, 0.6490249633789062, 0.665802001953125, 0.6825790405273438, 0.6993560791015625, 0.7161331176757812, 0.73291015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 12.0, 10.0, 13.0, 25.0, 24.0, 40.0, 72.0, 104.0, 187.0, 314.0, 575.0, 1175.0, 3163.0, 9716.0, 38475.0, 243415.0, 2991290.0, 796814.0, 80377.0, 18413.0, 5558.0, 2096.0, 1010.0, 556.0, 331.0, 178.0, 110.0, 81.0, 46.0, 33.0, 15.0, 12.0, 11.0, 4.0, 10.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5908203125, -0.5694961547851562, -0.5481719970703125, -0.5268478393554688, -0.505523681640625, -0.48419952392578125, -0.4628753662109375, -0.44155120849609375, -0.42022705078125, -0.39890289306640625, -0.3775787353515625, -0.35625457763671875, -0.334930419921875, -0.31360626220703125, -0.2922821044921875, -0.27095794677734375, -0.2496337890625, -0.22830963134765625, -0.2069854736328125, -0.18566131591796875, -0.164337158203125, -0.14301300048828125, -0.1216888427734375, -0.10036468505859375, -0.07904052734375, -0.05771636962890625, -0.0363922119140625, -0.01506805419921875, 0.006256103515625, 0.02758026123046875, 0.0489044189453125, 0.07022857666015625, 0.091552734375, 0.11287689208984375, 0.1342010498046875, 0.15552520751953125, 0.176849365234375, 0.19817352294921875, 0.2194976806640625, 0.24082183837890625, 0.26214599609375, 0.28347015380859375, 0.3047943115234375, 0.32611846923828125, 0.347442626953125, 0.36876678466796875, 0.3900909423828125, 0.41141510009765625, 0.4327392578125, 0.45406341552734375, 0.4753875732421875, 0.49671173095703125, 0.518035888671875, 0.5393600463867188, 0.5606842041015625, 0.5820083618164062, 0.60333251953125, 0.6246566772460938, 0.6459808349609375, 0.6673049926757812, 0.688629150390625, 0.7099533081054688, 0.7312774658203125, 0.7526016235351562, 0.77392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 7.0, 15.0, 28.0, 33.0, 58.0, 104.0, 245.0, 386.0, 782.0, 902.0, 673.0, 348.0, 204.0, 96.0, 55.0, 40.0, 21.0, 24.0, 15.0, 9.0, 7.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82763671875, -0.7949752807617188, -0.7623138427734375, -0.7296524047851562, -0.696990966796875, -0.6643295288085938, -0.6316680908203125, -0.5990066528320312, -0.56634521484375, -0.5336837768554688, -0.5010223388671875, -0.46836090087890625, -0.435699462890625, -0.40303802490234375, -0.3703765869140625, -0.33771514892578125, -0.3050537109375, -0.27239227294921875, -0.2397308349609375, -0.20706939697265625, -0.174407958984375, -0.14174652099609375, -0.1090850830078125, -0.07642364501953125, -0.04376220703125, -0.01110076904296875, 0.0215606689453125, 0.05422210693359375, 0.086883544921875, 0.11954498291015625, 0.1522064208984375, 0.18486785888671875, 0.217529296875, 0.25019073486328125, 0.2828521728515625, 0.31551361083984375, 0.348175048828125, 0.38083648681640625, 0.4134979248046875, 0.44615936279296875, 0.47882080078125, 0.5114822387695312, 0.5441436767578125, 0.5768051147460938, 0.609466552734375, 0.6421279907226562, 0.6747894287109375, 0.7074508666992188, 0.7401123046875, 0.7727737426757812, 0.8054351806640625, 0.8380966186523438, 0.870758056640625, 0.9034194946289062, 0.9360809326171875, 0.9687423706054688, 1.00140380859375, 1.0340652465820312, 1.0667266845703125, 1.0993881225585938, 1.132049560546875, 1.1647109985351562, 1.1973724365234375, 1.2300338745117188, 1.2626953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 13.0, 22.0, 105.0, 233.0, 305.0, 174.0, 76.0, 27.0, 16.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.742885589599609, -5.364243507385254, -4.985601902008057, -4.606959819793701, -4.228318214416504, -3.8496761322021484, -3.471034049987793, -3.0923922061920166, -2.7137503623962402, -2.335108518600464, -1.956466555595398, -1.577824592590332, -1.1991827487945557, -0.8205409049987793, -0.44189882278442383, -0.06325697898864746, 0.3153848648071289, 0.69402676820755, 1.0726686716079712, 1.451310634613037, 1.8299524784088135, 2.20859432220459, 2.5872364044189453, 2.9658782482147217, 3.344520092010498, 3.7231619358062744, 4.101803779602051, 4.480445861816406, 4.859087944030762, 5.237729549407959, 5.6163716316223145, 5.995013236999512, 6.373655319213867, 6.752297401428223, 7.13093900680542, 7.509581089019775, 7.888222694396973, 8.266864776611328, 8.645506858825684, 9.024148941040039, 9.402790069580078, 9.781432151794434, 10.160074234008789, 10.538715362548828, 10.917357444763184, 11.295999526977539, 11.674641609191895, 12.05328369140625, 12.431925773620605, 12.810567855834961, 13.189209938049316, 13.567852020263672, 13.946493148803711, 14.325135231018066, 14.703777313232422, 15.082419395446777, 15.461061477661133, 15.839703559875488, 16.218345642089844, 16.596986770629883, 16.975629806518555, 17.354270935058594, 17.732913970947266, 18.111555099487305, 18.490196228027344]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 15.0, 15.0, 28.0, 41.0, 58.0, 44.0, 61.0, 74.0, 56.0, 69.0, 69.0, 71.0, 68.0, 48.0, 57.0, 45.0, 33.0, 39.0, 17.0, 25.0, 15.0, 11.0, 9.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.110647678375244, -5.93239164352417, -5.754136085510254, -5.57588005065918, -5.3976240158081055, -5.219367980957031, -5.041112422943115, -4.862856388092041, -4.684600830078125, -4.506344795227051, -4.328089237213135, -4.1498332023620605, -3.9715771675109863, -3.793321371078491, -3.615065574645996, -3.436809539794922, -3.2585535049438477, -3.0802977085113525, -2.9020416736602783, -2.723785877227783, -2.545529842376709, -2.367274045944214, -2.1890182495117188, -2.0107622146606445, -1.8325064182281494, -1.6542505025863647, -1.47599458694458, -1.297738790512085, -1.1194828748703003, -0.9412269592285156, -0.7629711627960205, -0.5847152471542358, -0.4064598083496094, -0.2282039225101471, -0.049948036670684814, 0.12830781936645508, 0.30656373500823975, 0.4848196506500244, 0.6630754470825195, 0.8413313627243042, 1.0195872783660889, 1.1978431940078735, 1.3760991096496582, 1.5543549060821533, 1.732610821723938, 1.9108667373657227, 2.0891225337982178, 2.267378330230713, 2.445634365081787, 2.6238901615142822, 2.8021461963653564, 2.9804019927978516, 3.158658027648926, 3.336913824081421, 3.515169620513916, 3.6934256553649902, 3.8716814517974854, 4.0499372482299805, 4.228193283081055, 4.406449317932129, 4.584704875946045, 4.762960910797119, 4.941216468811035, 5.119472503662109, 5.297728538513184]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 11.0, 10.0, 17.0, 24.0, 28.0, 43.0, 87.0, 140.0, 271.0, 554.0, 1215.0, 2678.0, 7009.0, 21716.0, 73315.0, 248842.0, 424743.0, 187575.0, 54362.0, 16230.0, 5448.0, 2194.0, 971.0, 489.0, 238.0, 143.0, 60.0, 49.0, 29.0, 21.0, 10.0, 10.0, 8.0, 1.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59228515625, -0.5689468383789062, -0.5456085205078125, -0.5222702026367188, -0.498931884765625, -0.47559356689453125, -0.4522552490234375, -0.42891693115234375, -0.40557861328125, -0.38224029541015625, -0.3589019775390625, -0.33556365966796875, -0.312225341796875, -0.28888702392578125, -0.2655487060546875, -0.24221038818359375, -0.2188720703125, -0.19553375244140625, -0.1721954345703125, -0.14885711669921875, -0.125518798828125, -0.10218048095703125, -0.0788421630859375, -0.05550384521484375, -0.03216552734375, -0.00882720947265625, 0.0145111083984375, 0.03784942626953125, 0.061187744140625, 0.08452606201171875, 0.1078643798828125, 0.13120269775390625, 0.154541015625, 0.17787933349609375, 0.2012176513671875, 0.22455596923828125, 0.247894287109375, 0.27123260498046875, 0.2945709228515625, 0.31790924072265625, 0.34124755859375, 0.36458587646484375, 0.3879241943359375, 0.41126251220703125, 0.434600830078125, 0.45793914794921875, 0.4812774658203125, 0.5046157836914062, 0.5279541015625, 0.5512924194335938, 0.5746307373046875, 0.5979690551757812, 0.621307373046875, 0.6446456909179688, 0.6679840087890625, 0.6913223266601562, 0.71466064453125, 0.7379989624023438, 0.7613372802734375, 0.7846755981445312, 0.808013916015625, 0.8313522338867188, 0.8546905517578125, 0.8780288696289062, 0.9013671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 7.0, 6.0, 9.0, 12.0, 14.0, 13.0, 16.0, 25.0, 43.0, 28.0, 35.0, 46.0, 53.0, 56.0, 56.0, 68.0, 51.0, 53.0, 52.0, 43.0, 45.0, 43.0, 47.0, 30.0, 26.0, 23.0, 30.0, 14.0, 8.0, 8.0, 16.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32666015625, -0.3155059814453125, -0.304351806640625, -0.2931976318359375, -0.28204345703125, -0.2708892822265625, -0.259735107421875, -0.2485809326171875, -0.2374267578125, -0.2262725830078125, -0.215118408203125, -0.2039642333984375, -0.19281005859375, -0.1816558837890625, -0.170501708984375, -0.1593475341796875, -0.148193359375, -0.1370391845703125, -0.125885009765625, -0.1147308349609375, -0.10357666015625, -0.0924224853515625, -0.081268310546875, -0.0701141357421875, -0.0589599609375, -0.0478057861328125, -0.036651611328125, -0.0254974365234375, -0.01434326171875, -0.0031890869140625, 0.007965087890625, 0.0191192626953125, 0.0302734375, 0.0414276123046875, 0.052581787109375, 0.0637359619140625, 0.07489013671875, 0.0860443115234375, 0.097198486328125, 0.1083526611328125, 0.1195068359375, 0.1306610107421875, 0.141815185546875, 0.1529693603515625, 0.16412353515625, 0.1752777099609375, 0.186431884765625, 0.1975860595703125, 0.208740234375, 0.2198944091796875, 0.231048583984375, 0.2422027587890625, 0.25335693359375, 0.2645111083984375, 0.275665283203125, 0.2868194580078125, 0.2979736328125, 0.3091278076171875, 0.320281982421875, 0.3314361572265625, 0.34259033203125, 0.3537445068359375, 0.364898681640625, 0.3760528564453125, 0.38720703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 10.0, 3.0, 7.0, 15.0, 13.0, 19.0, 32.0, 38.0, 74.0, 69.0, 116.0, 197.0, 267.0, 398.0, 639.0, 1189.0, 2453.0, 7884.0, 46130.0, 530862.0, 402582.0, 42908.0, 7272.0, 2390.0, 1125.0, 644.0, 395.0, 246.0, 180.0, 121.0, 82.0, 52.0, 44.0, 28.0, 20.0, 15.0, 13.0, 8.0, 0.0, 3.0, 10.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.2435455322265625, -1.205841064453125, -1.1681365966796875, -1.13043212890625, -1.0927276611328125, -1.055023193359375, -1.0173187255859375, -0.9796142578125, -0.9419097900390625, -0.904205322265625, -0.8665008544921875, -0.82879638671875, -0.7910919189453125, -0.753387451171875, -0.7156829833984375, -0.677978515625, -0.6402740478515625, -0.602569580078125, -0.5648651123046875, -0.52716064453125, -0.4894561767578125, -0.451751708984375, -0.4140472412109375, -0.3763427734375, -0.3386383056640625, -0.300933837890625, -0.2632293701171875, -0.22552490234375, -0.1878204345703125, -0.150115966796875, -0.1124114990234375, -0.07470703125, -0.0370025634765625, 0.000701904296875, 0.0384063720703125, 0.07611083984375, 0.1138153076171875, 0.151519775390625, 0.1892242431640625, 0.2269287109375, 0.2646331787109375, 0.302337646484375, 0.3400421142578125, 0.37774658203125, 0.4154510498046875, 0.453155517578125, 0.4908599853515625, 0.528564453125, 0.5662689208984375, 0.603973388671875, 0.6416778564453125, 0.67938232421875, 0.7170867919921875, 0.754791259765625, 0.7924957275390625, 0.8302001953125, 0.8679046630859375, 0.905609130859375, 0.9433135986328125, 0.98101806640625, 1.0187225341796875, 1.056427001953125, 1.0941314697265625, 1.1318359375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 12.0, 5.0, 9.0, 13.0, 19.0, 27.0, 24.0, 30.0, 30.0, 51.0, 44.0, 55.0, 72.0, 67.0, 70.0, 67.0, 75.0, 52.0, 50.0, 34.0, 30.0, 35.0, 28.0, 22.0, 15.0, 8.0, 11.0, 4.0, 15.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5771484375, -1.531494140625, -1.48583984375, -1.440185546875, -1.39453125, -1.348876953125, -1.30322265625, -1.257568359375, -1.2119140625, -1.166259765625, -1.12060546875, -1.074951171875, -1.029296875, -0.983642578125, -0.93798828125, -0.892333984375, -0.8466796875, -0.801025390625, -0.75537109375, -0.709716796875, -0.6640625, -0.618408203125, -0.57275390625, -0.527099609375, -0.4814453125, -0.435791015625, -0.39013671875, -0.344482421875, -0.298828125, -0.253173828125, -0.20751953125, -0.161865234375, -0.1162109375, -0.070556640625, -0.02490234375, 0.020751953125, 0.06640625, 0.112060546875, 0.15771484375, 0.203369140625, 0.2490234375, 0.294677734375, 0.34033203125, 0.385986328125, 0.431640625, 0.477294921875, 0.52294921875, 0.568603515625, 0.6142578125, 0.659912109375, 0.70556640625, 0.751220703125, 0.796875, 0.842529296875, 0.88818359375, 0.933837890625, 0.9794921875, 1.025146484375, 1.07080078125, 1.116455078125, 1.162109375, 1.207763671875, 1.25341796875, 1.299072265625, 1.3447265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 9.0, 8.0, 13.0, 18.0, 18.0, 43.0, 58.0, 69.0, 123.0, 147.0, 279.0, 428.0, 932.0, 2250.0, 6936.0, 28160.0, 132295.0, 603332.0, 212058.0, 45099.0, 10645.0, 3041.0, 1205.0, 560.0, 295.0, 156.0, 118.0, 73.0, 53.0, 32.0, 14.0, 25.0, 14.0, 9.0, 12.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.274658203125, -0.2662467956542969, -0.25783538818359375, -0.24942398071289062, -0.2410125732421875, -0.23260116577148438, -0.22418975830078125, -0.21577835083007812, -0.207366943359375, -0.19895553588867188, -0.19054412841796875, -0.18213272094726562, -0.1737213134765625, -0.16530990600585938, -0.15689849853515625, -0.14848709106445312, -0.14007568359375, -0.13166427612304688, -0.12325286865234375, -0.11484146118164062, -0.1064300537109375, -0.09801864624023438, -0.08960723876953125, -0.08119583129882812, -0.072784423828125, -0.06437301635742188, -0.05596160888671875, -0.047550201416015625, -0.0391387939453125, -0.030727386474609375, -0.02231597900390625, -0.013904571533203125, -0.0054931640625, 0.002918243408203125, 0.01132965087890625, 0.019741058349609375, 0.0281524658203125, 0.036563873291015625, 0.04497528076171875, 0.053386688232421875, 0.061798095703125, 0.07020950317382812, 0.07862091064453125, 0.08703231811523438, 0.0954437255859375, 0.10385513305664062, 0.11226654052734375, 0.12067794799804688, 0.12908935546875, 0.13750076293945312, 0.14591217041015625, 0.15432357788085938, 0.1627349853515625, 0.17114639282226562, 0.17955780029296875, 0.18796920776367188, 0.196380615234375, 0.20479202270507812, 0.21320343017578125, 0.22161483764648438, 0.2300262451171875, 0.23843765258789062, 0.24684906005859375, 0.2552604675292969, 0.263671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 8.0, 9.0, 16.0, 11.0, 20.0, 26.0, 29.0, 44.0, 44.0, 51.0, 60.0, 59.0, 72.0, 73.0, 69.0, 75.0, 41.0, 62.0, 33.0, 36.0, 16.0, 22.0, 20.0, 15.0, 8.0, 11.0, 5.0, 11.0, 5.0, 4.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7756900787353516e-05, -5.570054054260254e-05, -5.364418029785156e-05, -5.1587820053100586e-05, -4.953145980834961e-05, -4.747509956359863e-05, -4.5418739318847656e-05, -4.336237907409668e-05, -4.13060188293457e-05, -3.9249658584594727e-05, -3.719329833984375e-05, -3.5136938095092773e-05, -3.30805778503418e-05, -3.102421760559082e-05, -2.8967857360839844e-05, -2.6911497116088867e-05, -2.485513687133789e-05, -2.2798776626586914e-05, -2.0742416381835938e-05, -1.868605613708496e-05, -1.6629695892333984e-05, -1.4573335647583008e-05, -1.2516975402832031e-05, -1.0460615158081055e-05, -8.404254913330078e-06, -6.3478946685791016e-06, -4.291534423828125e-06, -2.2351741790771484e-06, -1.7881393432617188e-07, 1.8775463104248047e-06, 3.933906555175781e-06, 5.990266799926758e-06, 8.046627044677734e-06, 1.0102987289428711e-05, 1.2159347534179688e-05, 1.4215707778930664e-05, 1.627206802368164e-05, 1.8328428268432617e-05, 2.0384788513183594e-05, 2.244114875793457e-05, 2.4497509002685547e-05, 2.6553869247436523e-05, 2.86102294921875e-05, 3.0666589736938477e-05, 3.272294998168945e-05, 3.477931022644043e-05, 3.6835670471191406e-05, 3.889203071594238e-05, 4.094839096069336e-05, 4.3004751205444336e-05, 4.506111145019531e-05, 4.711747169494629e-05, 4.9173831939697266e-05, 5.123019218444824e-05, 5.328655242919922e-05, 5.5342912673950195e-05, 5.739927291870117e-05, 5.945563316345215e-05, 6.151199340820312e-05, 6.35683536529541e-05, 6.562471389770508e-05, 6.768107414245605e-05, 6.973743438720703e-05, 7.179379463195801e-05, 7.385015487670898e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 0.0, 4.0, 9.0, 5.0, 9.0, 9.0, 12.0, 30.0, 45.0, 53.0, 91.0, 135.0, 237.0, 364.0, 731.0, 1394.0, 3183.0, 9380.0, 37882.0, 184714.0, 613579.0, 151388.0, 31429.0, 8094.0, 2869.0, 1233.0, 683.0, 392.0, 197.0, 124.0, 87.0, 57.0, 40.0, 29.0, 22.0, 13.0, 12.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.3022613525390625, -0.293731689453125, -0.2852020263671875, -0.27667236328125, -0.2681427001953125, -0.259613037109375, -0.2510833740234375, -0.2425537109375, -0.2340240478515625, -0.225494384765625, -0.2169647216796875, -0.20843505859375, -0.1999053955078125, -0.191375732421875, -0.1828460693359375, -0.17431640625, -0.1657867431640625, -0.157257080078125, -0.1487274169921875, -0.14019775390625, -0.1316680908203125, -0.123138427734375, -0.1146087646484375, -0.1060791015625, -0.0975494384765625, -0.089019775390625, -0.0804901123046875, -0.07196044921875, -0.0634307861328125, -0.054901123046875, -0.0463714599609375, -0.037841796875, -0.0293121337890625, -0.020782470703125, -0.0122528076171875, -0.00372314453125, 0.0048065185546875, 0.013336181640625, 0.0218658447265625, 0.0303955078125, 0.0389251708984375, 0.047454833984375, 0.0559844970703125, 0.06451416015625, 0.0730438232421875, 0.081573486328125, 0.0901031494140625, 0.0986328125, 0.1071624755859375, 0.115692138671875, 0.1242218017578125, 0.13275146484375, 0.1412811279296875, 0.149810791015625, 0.1583404541015625, 0.1668701171875, 0.1753997802734375, 0.183929443359375, 0.1924591064453125, 0.20098876953125, 0.2095184326171875, 0.218048095703125, 0.2265777587890625, 0.235107421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 6.0, 11.0, 8.0, 16.0, 12.0, 19.0, 20.0, 26.0, 31.0, 39.0, 36.0, 56.0, 52.0, 61.0, 62.0, 68.0, 55.0, 62.0, 51.0, 41.0, 48.0, 41.0, 28.0, 30.0, 20.0, 17.0, 16.0, 4.0, 7.0, 14.0, 9.0, 4.0, 10.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.273681640625, -0.26654815673828125, -0.2594146728515625, -0.25228118896484375, -0.245147705078125, -0.23801422119140625, -0.2308807373046875, -0.22374725341796875, -0.21661376953125, -0.20948028564453125, -0.2023468017578125, -0.19521331787109375, -0.188079833984375, -0.18094635009765625, -0.1738128662109375, -0.16667938232421875, -0.1595458984375, -0.15241241455078125, -0.1452789306640625, -0.13814544677734375, -0.131011962890625, -0.12387847900390625, -0.1167449951171875, -0.10961151123046875, -0.10247802734375, -0.09534454345703125, -0.0882110595703125, -0.08107757568359375, -0.073944091796875, -0.06681060791015625, -0.0596771240234375, -0.05254364013671875, -0.04541015625, -0.03827667236328125, -0.0311431884765625, -0.02400970458984375, -0.016876220703125, -0.00974273681640625, -0.0026092529296875, 0.00452423095703125, 0.01165771484375, 0.01879119873046875, 0.0259246826171875, 0.03305816650390625, 0.040191650390625, 0.04732513427734375, 0.0544586181640625, 0.06159210205078125, 0.0687255859375, 0.07585906982421875, 0.0829925537109375, 0.09012603759765625, 0.097259521484375, 0.10439300537109375, 0.1115264892578125, 0.11865997314453125, 0.12579345703125, 0.13292694091796875, 0.1400604248046875, 0.14719390869140625, 0.154327392578125, 0.16146087646484375, 0.1685943603515625, 0.17572784423828125, 0.182861328125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 18.0, 14.0, 49.0, 128.0, 243.0, 320.0, 143.0, 55.0, 15.0, 4.0, 4.0, 2.0, 0.0, 3.0], "bins": [-20.081356048583984, -19.719009399414062, -19.356664657592773, -18.99431800842285, -18.63197135925293, -18.26962661743164, -17.90727996826172, -17.544933319091797, -17.182586669921875, -16.820240020751953, -16.457895278930664, -16.095548629760742, -15.73320198059082, -15.370856285095215, -15.00851058959961, -14.646163940429688, -14.283819198608398, -13.921473503112793, -13.559126853942871, -13.196781158447266, -12.834434509277344, -12.472088813781738, -12.109743118286133, -11.747396469116211, -11.385049819946289, -11.022704124450684, -10.660357475280762, -10.298011779785156, -9.935665130615234, -9.573319435119629, -9.210973739624023, -8.848627090454102, -8.486282348632812, -8.123936653137207, -7.761590003967285, -7.39924430847168, -7.036898136138916, -6.674551963806152, -6.312205791473389, -5.949859619140625, -5.587512969970703, -5.2251667976379395, -4.862820625305176, -4.50047492980957, -4.138128757476807, -3.775782585144043, -3.4134364128112793, -3.0510904788970947, -2.68874454498291, -2.3263983726501465, -1.964052438735962, -1.6017062664031982, -1.2393602132797241, -0.87701416015625, -0.5146679878234863, -0.15232205390930176, 0.21002411842346191, 0.572370171546936, 0.9347162842750549, 1.2970623970031738, 1.659408450126648, 2.021754503250122, 2.3841006755828857, 2.7464466094970703, 3.108792781829834]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 9.0, 8.0, 11.0, 12.0, 16.0, 14.0, 28.0, 24.0, 27.0, 48.0, 34.0, 43.0, 48.0, 57.0, 71.0, 89.0, 74.0, 51.0, 52.0, 49.0, 27.0, 41.0, 17.0, 20.0, 17.0, 21.0, 14.0, 11.0, 15.0, 9.0, 4.0, 11.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.043880939483643, -4.883065223693848, -4.7222490310668945, -4.5614333152771, -4.400617599487305, -4.23980188369751, -4.078986167907715, -3.9181699752807617, -3.757354259490967, -3.596538543701172, -3.435722589492798, -3.274906635284424, -3.114090919494629, -2.953275203704834, -2.79245924949646, -2.631643295288086, -2.470827579498291, -2.310011863708496, -2.149195909500122, -1.9883800745010376, -1.8275642395019531, -1.6667484045028687, -1.5059325695037842, -1.3451167345046997, -1.1843008995056152, -1.0234850645065308, -0.8626692295074463, -0.7018533945083618, -0.5410375595092773, -0.38022172451019287, -0.2194058895111084, -0.058590054512023926, 0.10222625732421875, 0.2630420923233032, 0.4238579273223877, 0.5846737623214722, 0.7454895973205566, 0.9063054323196411, 1.0671212673187256, 1.22793710231781, 1.3887529373168945, 1.549568772315979, 1.7103846073150635, 1.871200442314148, 2.0320162773132324, 2.1928319931030273, 2.3536479473114014, 2.5144639015197754, 2.6752796173095703, 2.8360953330993652, 2.9969112873077393, 3.1577272415161133, 3.318542957305908, 3.479358673095703, 3.640174627304077, 3.800990581512451, 3.961806297302246, 4.122622013092041, 4.283437728881836, 4.444253921508789, 4.605069637298584, 4.765885353088379, 4.926701545715332, 5.087517261505127, 5.248332977294922]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 4.0, 9.0, 10.0, 21.0, 35.0, 48.0, 81.0, 156.0, 254.0, 544.0, 1508.0, 4665.0, 22190.0, 232088.0, 3267693.0, 614942.0, 38892.0, 7448.0, 2128.0, 776.0, 321.0, 172.0, 100.0, 71.0, 37.0, 25.0, 15.0, 7.0, 14.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5626296997070312, -0.5388336181640625, -0.5150375366210938, -0.491241455078125, -0.46744537353515625, -0.4436492919921875, -0.41985321044921875, -0.39605712890625, -0.37226104736328125, -0.3484649658203125, -0.32466888427734375, -0.300872802734375, -0.27707672119140625, -0.2532806396484375, -0.22948455810546875, -0.2056884765625, -0.18189239501953125, -0.1580963134765625, -0.13430023193359375, -0.110504150390625, -0.08670806884765625, -0.0629119873046875, -0.03911590576171875, -0.01531982421875, 0.00847625732421875, 0.0322723388671875, 0.05606842041015625, 0.079864501953125, 0.10366058349609375, 0.1274566650390625, 0.15125274658203125, 0.175048828125, 0.19884490966796875, 0.2226409912109375, 0.24643707275390625, 0.270233154296875, 0.29402923583984375, 0.3178253173828125, 0.34162139892578125, 0.36541748046875, 0.38921356201171875, 0.4130096435546875, 0.43680572509765625, 0.460601806640625, 0.48439788818359375, 0.5081939697265625, 0.5319900512695312, 0.5557861328125, 0.5795822143554688, 0.6033782958984375, 0.6271743774414062, 0.650970458984375, 0.6747665405273438, 0.6985626220703125, 0.7223587036132812, 0.74615478515625, 0.7699508666992188, 0.7937469482421875, 0.8175430297851562, 0.841339111328125, 0.8651351928710938, 0.8889312744140625, 0.9127273559570312, 0.9365234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 11.0, 11.0, 11.0, 15.0, 15.0, 22.0, 23.0, 21.0, 31.0, 21.0, 36.0, 46.0, 42.0, 65.0, 61.0, 49.0, 51.0, 45.0, 46.0, 36.0, 60.0, 38.0, 45.0, 39.0, 24.0, 24.0, 21.0, 14.0, 11.0, 14.0, 12.0, 11.0, 5.0, 1.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.333984375, -0.3247489929199219, -0.31551361083984375, -0.3062782287597656, -0.2970428466796875, -0.2878074645996094, -0.27857208251953125, -0.2693367004394531, -0.260101318359375, -0.2508659362792969, -0.24163055419921875, -0.23239517211914062, -0.2231597900390625, -0.21392440795898438, -0.20468902587890625, -0.19545364379882812, -0.18621826171875, -0.17698287963867188, -0.16774749755859375, -0.15851211547851562, -0.1492767333984375, -0.14004135131835938, -0.13080596923828125, -0.12157058715820312, -0.112335205078125, -0.10309982299804688, -0.09386444091796875, -0.08462905883789062, -0.0753936767578125, -0.06615829467773438, -0.05692291259765625, -0.047687530517578125, -0.0384521484375, -0.029216766357421875, -0.01998138427734375, -0.010746002197265625, -0.0015106201171875, 0.007724761962890625, 0.01696014404296875, 0.026195526123046875, 0.035430908203125, 0.044666290283203125, 0.05390167236328125, 0.06313705444335938, 0.0723724365234375, 0.08160781860351562, 0.09084320068359375, 0.10007858276367188, 0.10931396484375, 0.11854934692382812, 0.12778472900390625, 0.13702011108398438, 0.1462554931640625, 0.15549087524414062, 0.16472625732421875, 0.17396163940429688, 0.183197021484375, 0.19243240356445312, 0.20166778564453125, 0.21090316772460938, 0.2201385498046875, 0.22937393188476562, 0.23860931396484375, 0.24784469604492188, 0.257080078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 11.0, 17.0, 32.0, 49.0, 72.0, 155.0, 323.0, 560.0, 1533.0, 5149.0, 24859.0, 316449.0, 3642266.0, 179366.0, 17410.0, 3765.0, 1150.0, 527.0, 258.0, 135.0, 68.0, 34.0, 32.0, 14.0, 14.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0221481323242188, -0.9915618896484375, -0.9609756469726562, -0.930389404296875, -0.8998031616210938, -0.8692169189453125, -0.8386306762695312, -0.80804443359375, -0.7774581909179688, -0.7468719482421875, -0.7162857055664062, -0.685699462890625, -0.6551132202148438, -0.6245269775390625, -0.5939407348632812, -0.5633544921875, -0.5327682495117188, -0.5021820068359375, -0.47159576416015625, -0.441009521484375, -0.41042327880859375, -0.3798370361328125, -0.34925079345703125, -0.31866455078125, -0.28807830810546875, -0.2574920654296875, -0.22690582275390625, -0.196319580078125, -0.16573333740234375, -0.1351470947265625, -0.10456085205078125, -0.073974609375, -0.04338836669921875, -0.0128021240234375, 0.01778411865234375, 0.048370361328125, 0.07895660400390625, 0.1095428466796875, 0.14012908935546875, 0.17071533203125, 0.20130157470703125, 0.2318878173828125, 0.26247406005859375, 0.293060302734375, 0.32364654541015625, 0.3542327880859375, 0.38481903076171875, 0.4154052734375, 0.44599151611328125, 0.4765777587890625, 0.5071640014648438, 0.537750244140625, 0.5683364868164062, 0.5989227294921875, 0.6295089721679688, 0.66009521484375, 0.6906814575195312, 0.7212677001953125, 0.7518539428710938, 0.782440185546875, 0.8130264282226562, 0.8436126708984375, 0.8741989135742188, 0.90478515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 4.0, 12.0, 7.0, 10.0, 7.0, 17.0, 19.0, 32.0, 45.0, 74.0, 129.0, 182.0, 349.0, 526.0, 688.0, 722.0, 497.0, 292.0, 132.0, 116.0, 62.0, 44.0, 32.0, 20.0, 12.0, 13.0, 7.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.92236328125, -0.8986053466796875, -0.874847412109375, -0.8510894775390625, -0.82733154296875, -0.8035736083984375, -0.779815673828125, -0.7560577392578125, -0.7322998046875, -0.7085418701171875, -0.684783935546875, -0.6610260009765625, -0.63726806640625, -0.6135101318359375, -0.589752197265625, -0.5659942626953125, -0.542236328125, -0.5184783935546875, -0.494720458984375, -0.4709625244140625, -0.44720458984375, -0.4234466552734375, -0.399688720703125, -0.3759307861328125, -0.3521728515625, -0.3284149169921875, -0.304656982421875, -0.2808990478515625, -0.25714111328125, -0.2333831787109375, -0.209625244140625, -0.1858673095703125, -0.162109375, -0.1383514404296875, -0.114593505859375, -0.0908355712890625, -0.06707763671875, -0.0433197021484375, -0.019561767578125, 0.0041961669921875, 0.0279541015625, 0.0517120361328125, 0.075469970703125, 0.0992279052734375, 0.12298583984375, 0.1467437744140625, 0.170501708984375, 0.1942596435546875, 0.218017578125, 0.2417755126953125, 0.265533447265625, 0.2892913818359375, 0.31304931640625, 0.3368072509765625, 0.360565185546875, 0.3843231201171875, 0.4080810546875, 0.4318389892578125, 0.455596923828125, 0.4793548583984375, 0.50311279296875, 0.5268707275390625, 0.550628662109375, 0.5743865966796875, 0.59814453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 14.0, 31.0, 68.0, 120.0, 167.0, 187.0, 183.0, 100.0, 52.0, 30.0, 16.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0898027420043945, -4.85304594039917, -4.616289138793945, -4.379532337188721, -4.142775535583496, -3.9060187339782715, -3.669261932373047, -3.4325051307678223, -3.1957483291625977, -2.958991527557373, -2.7222347259521484, -2.485477924346924, -2.248721122741699, -2.0119643211364746, -1.77520751953125, -1.5384507179260254, -1.3016939163208008, -1.0649371147155762, -0.8281803131103516, -0.591423511505127, -0.35466670989990234, -0.11790990829467773, 0.11884689331054688, 0.3556036949157715, 0.5923604965209961, 0.8291172981262207, 1.0658740997314453, 1.30263090133667, 1.5393877029418945, 1.7761445045471191, 2.0129013061523438, 2.2496581077575684, 2.486414909362793, 2.7231717109680176, 2.959928512573242, 3.196685314178467, 3.4334421157836914, 3.670198917388916, 3.9069557189941406, 4.143712520599365, 4.38046932220459, 4.6172261238098145, 4.853982925415039, 5.090739727020264, 5.327496528625488, 5.564253330230713, 5.8010101318359375, 6.037766933441162, 6.274523735046387, 6.511280536651611, 6.748037338256836, 6.9847941398620605, 7.221550941467285, 7.45830774307251, 7.695064544677734, 7.931821346282959, 8.168578147888184, 8.40533447265625, 8.642091751098633, 8.878849029541016, 9.115605354309082, 9.352361679077148, 9.589118957519531, 9.825876235961914, 10.06263256072998]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 14.0, 13.0, 16.0, 21.0, 27.0, 39.0, 35.0, 41.0, 44.0, 51.0, 55.0, 91.0, 50.0, 62.0, 55.0, 48.0, 54.0, 57.0, 40.0, 30.0, 34.0, 28.0, 21.0, 15.0, 10.0, 12.0, 6.0, 6.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12051248550415, -3.9956350326538086, -3.870757818222046, -3.745880603790283, -3.6210031509399414, -3.4961256980895996, -3.371248483657837, -3.246371269226074, -3.1214938163757324, -2.9966163635253906, -2.871739149093628, -2.7468619346618652, -2.6219844818115234, -2.4971070289611816, -2.372229814529419, -2.2473526000976562, -2.1224751472473145, -1.9975978136062622, -1.87272047996521, -1.7478431463241577, -1.6229658126831055, -1.4980884790420532, -1.373211145401001, -1.2483338117599487, -1.1234564781188965, -0.9985791444778442, -0.873701810836792, -0.7488244771957397, -0.6239471435546875, -0.49906980991363525, -0.374192476272583, -0.24931514263153076, -0.12443804740905762, 0.0004392862319946289, 0.12531661987304688, 0.2501939535140991, 0.37507128715515137, 0.4999486207962036, 0.6248259544372559, 0.7497032880783081, 0.8745806217193604, 0.9994579553604126, 1.1243352890014648, 1.249212622642517, 1.3740899562835693, 1.4989672899246216, 1.6238446235656738, 1.748721957206726, 1.8735992908477783, 1.9984766244888306, 2.123353958129883, 2.2482314109802246, 2.3731086254119873, 2.49798583984375, 2.622863292694092, 2.7477407455444336, 2.8726179599761963, 2.997495174407959, 3.122372627258301, 3.2472500801086426, 3.3721272945404053, 3.497004508972168, 3.6218819618225098, 3.7467594146728516, 3.8716366291046143]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 3.0, 9.0, 9.0, 15.0, 19.0, 24.0, 36.0, 72.0, 97.0, 198.0, 367.0, 700.0, 1501.0, 3333.0, 9044.0, 28027.0, 97554.0, 293362.0, 382472.0, 161451.0, 46940.0, 13984.0, 5029.0, 2169.0, 972.0, 521.0, 262.0, 131.0, 97.0, 51.0, 29.0, 16.0, 13.0, 8.0, 8.0, 9.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7607421875, -0.7391357421875, -0.717529296875, -0.6959228515625, -0.67431640625, -0.6527099609375, -0.631103515625, -0.6094970703125, -0.587890625, -0.5662841796875, -0.544677734375, -0.5230712890625, -0.50146484375, -0.4798583984375, -0.458251953125, -0.4366455078125, -0.4150390625, -0.3934326171875, -0.371826171875, -0.3502197265625, -0.32861328125, -0.3070068359375, -0.285400390625, -0.2637939453125, -0.2421875, -0.2205810546875, -0.198974609375, -0.1773681640625, -0.15576171875, -0.1341552734375, -0.112548828125, -0.0909423828125, -0.0693359375, -0.0477294921875, -0.026123046875, -0.0045166015625, 0.01708984375, 0.0386962890625, 0.060302734375, 0.0819091796875, 0.103515625, 0.1251220703125, 0.146728515625, 0.1683349609375, 0.18994140625, 0.2115478515625, 0.233154296875, 0.2547607421875, 0.2763671875, 0.2979736328125, 0.319580078125, 0.3411865234375, 0.36279296875, 0.3843994140625, 0.406005859375, 0.4276123046875, 0.44921875, 0.4708251953125, 0.492431640625, 0.5140380859375, 0.53564453125, 0.5572509765625, 0.578857421875, 0.6004638671875, 0.6220703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 2.0, 6.0, 10.0, 14.0, 11.0, 17.0, 23.0, 27.0, 35.0, 30.0, 38.0, 41.0, 41.0, 51.0, 60.0, 53.0, 71.0, 41.0, 64.0, 38.0, 45.0, 43.0, 39.0, 35.0, 28.0, 31.0, 21.0, 15.0, 13.0, 10.0, 11.0, 12.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.33420562744140625, -0.3239288330078125, -0.31365203857421875, -0.303375244140625, -0.29309844970703125, -0.2828216552734375, -0.27254486083984375, -0.26226806640625, -0.25199127197265625, -0.2417144775390625, -0.23143768310546875, -0.221160888671875, -0.21088409423828125, -0.2006072998046875, -0.19033050537109375, -0.1800537109375, -0.16977691650390625, -0.1595001220703125, -0.14922332763671875, -0.138946533203125, -0.12866973876953125, -0.1183929443359375, -0.10811614990234375, -0.09783935546875, -0.08756256103515625, -0.0772857666015625, -0.06700897216796875, -0.056732177734375, -0.04645538330078125, -0.0361785888671875, -0.02590179443359375, -0.015625, -0.00534820556640625, 0.0049285888671875, 0.01520538330078125, 0.025482177734375, 0.03575897216796875, 0.0460357666015625, 0.05631256103515625, 0.06658935546875, 0.07686614990234375, 0.0871429443359375, 0.09741973876953125, 0.107696533203125, 0.11797332763671875, 0.1282501220703125, 0.13852691650390625, 0.1488037109375, 0.15908050537109375, 0.1693572998046875, 0.17963409423828125, 0.189910888671875, 0.20018768310546875, 0.2104644775390625, 0.22074127197265625, 0.23101806640625, 0.24129486083984375, 0.2515716552734375, 0.26184844970703125, 0.272125244140625, 0.28240203857421875, 0.2926788330078125, 0.30295562744140625, 0.313232421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 5.0, 5.0, 10.0, 7.0, 11.0, 11.0, 23.0, 26.0, 25.0, 44.0, 63.0, 91.0, 118.0, 252.0, 465.0, 984.0, 2740.0, 10557.0, 52131.0, 284272.0, 580017.0, 92336.0, 17556.0, 4143.0, 1324.0, 540.0, 246.0, 159.0, 112.0, 72.0, 41.0, 44.0, 33.0, 24.0, 12.0, 14.0, 6.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7841796875, -0.75531005859375, -0.7264404296875, -0.69757080078125, -0.668701171875, -0.63983154296875, -0.6109619140625, -0.58209228515625, -0.55322265625, -0.52435302734375, -0.4954833984375, -0.46661376953125, -0.437744140625, -0.40887451171875, -0.3800048828125, -0.35113525390625, -0.322265625, -0.29339599609375, -0.2645263671875, -0.23565673828125, -0.206787109375, -0.17791748046875, -0.1490478515625, -0.12017822265625, -0.09130859375, -0.06243896484375, -0.0335693359375, -0.00469970703125, 0.024169921875, 0.05303955078125, 0.0819091796875, 0.11077880859375, 0.1396484375, 0.16851806640625, 0.1973876953125, 0.22625732421875, 0.255126953125, 0.28399658203125, 0.3128662109375, 0.34173583984375, 0.37060546875, 0.39947509765625, 0.4283447265625, 0.45721435546875, 0.486083984375, 0.51495361328125, 0.5438232421875, 0.57269287109375, 0.6015625, 0.63043212890625, 0.6593017578125, 0.68817138671875, 0.717041015625, 0.74591064453125, 0.7747802734375, 0.80364990234375, 0.83251953125, 0.86138916015625, 0.8902587890625, 0.91912841796875, 0.947998046875, 0.97686767578125, 1.0057373046875, 1.03460693359375, 1.0634765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 5.0, 2.0, 2.0, 7.0, 15.0, 7.0, 14.0, 12.0, 16.0, 23.0, 18.0, 22.0, 21.0, 21.0, 33.0, 27.0, 22.0, 44.0, 37.0, 41.0, 41.0, 31.0, 45.0, 53.0, 48.0, 28.0, 36.0, 42.0, 23.0, 43.0, 22.0, 25.0, 20.0, 25.0, 22.0, 18.0, 13.0, 9.0, 8.0, 7.0, 9.0, 8.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.82568359375, -0.797943115234375, -0.77020263671875, -0.742462158203125, -0.7147216796875, -0.686981201171875, -0.65924072265625, -0.631500244140625, -0.603759765625, -0.576019287109375, -0.54827880859375, -0.520538330078125, -0.4927978515625, -0.465057373046875, -0.43731689453125, -0.409576416015625, -0.3818359375, -0.354095458984375, -0.32635498046875, -0.298614501953125, -0.2708740234375, -0.243133544921875, -0.21539306640625, -0.187652587890625, -0.159912109375, -0.132171630859375, -0.10443115234375, -0.076690673828125, -0.0489501953125, -0.021209716796875, 0.00653076171875, 0.034271240234375, 0.06201171875, 0.089752197265625, 0.11749267578125, 0.145233154296875, 0.1729736328125, 0.200714111328125, 0.22845458984375, 0.256195068359375, 0.283935546875, 0.311676025390625, 0.33941650390625, 0.367156982421875, 0.3948974609375, 0.422637939453125, 0.45037841796875, 0.478118896484375, 0.505859375, 0.533599853515625, 0.56134033203125, 0.589080810546875, 0.6168212890625, 0.644561767578125, 0.67230224609375, 0.700042724609375, 0.727783203125, 0.755523681640625, 0.78326416015625, 0.811004638671875, 0.8387451171875, 0.866485595703125, 0.89422607421875, 0.921966552734375, 0.94970703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 11.0, 23.0, 51.0, 54.0, 107.0, 199.0, 513.0, 1148.0, 3274.0, 9840.0, 34891.0, 138254.0, 585450.0, 203091.0, 50680.0, 13853.0, 4364.0, 1496.0, 609.0, 274.0, 131.0, 78.0, 55.0, 32.0, 16.0, 10.0, 13.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2978515625, -0.2897224426269531, -0.28159332275390625, -0.2734642028808594, -0.2653350830078125, -0.2572059631347656, -0.24907684326171875, -0.24094772338867188, -0.232818603515625, -0.22468948364257812, -0.21656036376953125, -0.20843124389648438, -0.2003021240234375, -0.19217300415039062, -0.18404388427734375, -0.17591476440429688, -0.16778564453125, -0.15965652465820312, -0.15152740478515625, -0.14339828491210938, -0.1352691650390625, -0.12714004516601562, -0.11901092529296875, -0.11088180541992188, -0.102752685546875, -0.09462356567382812, -0.08649444580078125, -0.07836532592773438, -0.0702362060546875, -0.062107086181640625, -0.05397796630859375, -0.045848846435546875, -0.0377197265625, -0.029590606689453125, -0.02146148681640625, -0.013332366943359375, -0.0052032470703125, 0.002925872802734375, 0.01105499267578125, 0.019184112548828125, 0.027313232421875, 0.035442352294921875, 0.04357147216796875, 0.051700592041015625, 0.0598297119140625, 0.06795883178710938, 0.07608795166015625, 0.08421707153320312, 0.09234619140625, 0.10047531127929688, 0.10860443115234375, 0.11673355102539062, 0.1248626708984375, 0.13299179077148438, 0.14112091064453125, 0.14925003051757812, 0.157379150390625, 0.16550827026367188, 0.17363739013671875, 0.18176651000976562, 0.1898956298828125, 0.19802474975585938, 0.20615386962890625, 0.21428298950195312, 0.222412109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 12.0, 8.0, 13.0, 11.0, 18.0, 22.0, 26.0, 53.0, 60.0, 80.0, 112.0, 91.0, 88.0, 92.0, 71.0, 59.0, 60.0, 24.0, 34.0, 24.0, 11.0, 13.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.104873657226562e-05, -6.851367652416229e-05, -6.597861647605896e-05, -6.344355642795563e-05, -6.0908496379852295e-05, -5.837343633174896e-05, -5.583837628364563e-05, -5.33033162355423e-05, -5.0768256187438965e-05, -4.823319613933563e-05, -4.56981360912323e-05, -4.316307604312897e-05, -4.0628015995025635e-05, -3.80929559469223e-05, -3.555789589881897e-05, -3.302283585071564e-05, -3.0487775802612305e-05, -2.7952715754508972e-05, -2.541765570640564e-05, -2.2882595658302307e-05, -2.0347535610198975e-05, -1.7812475562095642e-05, -1.527741551399231e-05, -1.2742355465888977e-05, -1.0207295417785645e-05, -7.672235369682312e-06, -5.1371753215789795e-06, -2.602115273475647e-06, -6.705522537231445e-08, 2.468004822731018e-06, 5.003064870834351e-06, 7.538124918937683e-06, 1.0073184967041016e-05, 1.2608245015144348e-05, 1.514330506324768e-05, 1.7678365111351013e-05, 2.0213425159454346e-05, 2.2748485207557678e-05, 2.528354525566101e-05, 2.7818605303764343e-05, 3.0353665351867676e-05, 3.288872539997101e-05, 3.542378544807434e-05, 3.795884549617767e-05, 4.0493905544281006e-05, 4.302896559238434e-05, 4.556402564048767e-05, 4.8099085688591003e-05, 5.0634145736694336e-05, 5.316920578479767e-05, 5.5704265832901e-05, 5.8239325881004333e-05, 6.0774385929107666e-05, 6.3309445977211e-05, 6.584450602531433e-05, 6.837956607341766e-05, 7.0914626121521e-05, 7.344968616962433e-05, 7.598474621772766e-05, 7.8519806265831e-05, 8.105486631393433e-05, 8.358992636203766e-05, 8.612498641014099e-05, 8.866004645824432e-05, 9.119510650634766e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 10.0, 5.0, 18.0, 15.0, 20.0, 34.0, 70.0, 142.0, 355.0, 880.0, 3080.0, 16347.0, 124212.0, 708727.0, 167404.0, 21554.0, 3868.0, 1019.0, 401.0, 156.0, 90.0, 58.0, 25.0, 16.0, 20.0, 8.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4814453125, -0.468963623046875, -0.45648193359375, -0.444000244140625, -0.4315185546875, -0.419036865234375, -0.40655517578125, -0.394073486328125, -0.381591796875, -0.369110107421875, -0.35662841796875, -0.344146728515625, -0.3316650390625, -0.319183349609375, -0.30670166015625, -0.294219970703125, -0.28173828125, -0.269256591796875, -0.25677490234375, -0.244293212890625, -0.2318115234375, -0.219329833984375, -0.20684814453125, -0.194366455078125, -0.181884765625, -0.169403076171875, -0.15692138671875, -0.144439697265625, -0.1319580078125, -0.119476318359375, -0.10699462890625, -0.094512939453125, -0.08203125, -0.069549560546875, -0.05706787109375, -0.044586181640625, -0.0321044921875, -0.019622802734375, -0.00714111328125, 0.005340576171875, 0.017822265625, 0.030303955078125, 0.04278564453125, 0.055267333984375, 0.0677490234375, 0.080230712890625, 0.09271240234375, 0.105194091796875, 0.11767578125, 0.130157470703125, 0.14263916015625, 0.155120849609375, 0.1676025390625, 0.180084228515625, 0.19256591796875, 0.205047607421875, 0.217529296875, 0.230010986328125, 0.24249267578125, 0.254974365234375, 0.2674560546875, 0.279937744140625, 0.29241943359375, 0.304901123046875, 0.3173828125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 11.0, 8.0, 20.0, 19.0, 28.0, 32.0, 37.0, 38.0, 51.0, 60.0, 56.0, 65.0, 70.0, 82.0, 60.0, 62.0, 62.0, 44.0, 38.0, 27.0, 17.0, 22.0, 23.0, 14.0, 8.0, 13.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23779296875, -0.22983932495117188, -0.22188568115234375, -0.21393203735351562, -0.2059783935546875, -0.19802474975585938, -0.19007110595703125, -0.18211746215820312, -0.174163818359375, -0.16621017456054688, -0.15825653076171875, -0.15030288696289062, -0.1423492431640625, -0.13439559936523438, -0.12644195556640625, -0.11848831176757812, -0.11053466796875, -0.10258102416992188, -0.09462738037109375, -0.08667373657226562, -0.0787200927734375, -0.07076644897460938, -0.06281280517578125, -0.054859161376953125, -0.046905517578125, -0.038951873779296875, -0.03099822998046875, -0.023044586181640625, -0.0150909423828125, -0.007137298583984375, 0.00081634521484375, 0.008769989013671875, 0.0167236328125, 0.024677276611328125, 0.03263092041015625, 0.040584564208984375, 0.0485382080078125, 0.056491851806640625, 0.06444549560546875, 0.07239913940429688, 0.080352783203125, 0.08830642700195312, 0.09626007080078125, 0.10421371459960938, 0.1121673583984375, 0.12012100219726562, 0.12807464599609375, 0.13602828979492188, 0.14398193359375, 0.15193557739257812, 0.15988922119140625, 0.16784286499023438, 0.1757965087890625, 0.18375015258789062, 0.19170379638671875, 0.19965744018554688, 0.207611083984375, 0.21556472778320312, 0.22351837158203125, 0.23147201538085938, 0.2394256591796875, 0.24737930297851562, 0.25533294677734375, 0.2632865905761719, 0.271240234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 12.0, 22.0, 75.0, 130.0, 308.0, 255.0, 120.0, 43.0, 13.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.501377105712891, -7.187282085418701, -6.873187065124512, -6.559092044830322, -6.244997024536133, -5.930902004241943, -5.616806983947754, -5.302712440490723, -4.988616943359375, -4.6745219230651855, -4.360426902770996, -4.046331882476807, -3.732236862182617, -3.4181418418884277, -3.1040470600128174, -2.789952039718628, -2.4758572578430176, -2.161762237548828, -1.8476672172546387, -1.5335723161697388, -1.2194772958755493, -0.9053822755813599, -0.59128737449646, -0.2771923542022705, 0.036902666091918945, 0.350997656583786, 0.6650926470756531, 0.9791876077651978, 1.2932826280593872, 1.6073776483535767, 1.9214725494384766, 2.235567569732666, 2.5496625900268555, 2.863757610321045, 3.1778526306152344, 3.491947650909424, 3.8060426712036133, 4.120137691497803, 4.434232711791992, 4.748327255249023, 5.062422752380371, 5.3765177726745605, 5.69061279296875, 6.0047078132629395, 6.318802833557129, 6.632897853851318, 6.946992874145508, 7.261087417602539, 7.5751824378967285, 7.889277458190918, 8.20337200164795, 8.517467498779297, 8.831562042236328, 9.145657539367676, 9.459752082824707, 9.773847579956055, 10.087942123413086, 10.402036666870117, 10.716132164001465, 11.030226707458496, 11.344322204589844, 11.658416748046875, 11.972512245178223, 12.286606788635254, 12.600702285766602]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 6.0, 3.0, 4.0, 13.0, 5.0, 8.0, 9.0, 14.0, 16.0, 7.0, 23.0, 12.0, 14.0, 25.0, 28.0, 24.0, 30.0, 30.0, 46.0, 48.0, 70.0, 75.0, 70.0, 56.0, 49.0, 28.0, 42.0, 32.0, 35.0, 27.0, 25.0, 20.0, 16.0, 23.0, 12.0, 13.0, 11.0, 7.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.901181221008301, -3.781344413757324, -3.6615076065063477, -3.541670799255371, -3.4218339920043945, -3.301997184753418, -3.1821601390838623, -3.0623233318328857, -2.942486524581909, -2.8226497173309326, -2.702812910079956, -2.5829761028289795, -2.463139057159424, -2.3433022499084473, -2.2234654426574707, -2.103628635406494, -1.9837918281555176, -1.863955020904541, -1.7441182136535645, -1.6242812871932983, -1.5044444799423218, -1.3846076726913452, -1.264770746231079, -1.1449339389801025, -1.025097131729126, -0.9052603244781494, -0.7854234576225281, -0.6655865907669067, -0.5457497835159302, -0.4259129762649536, -0.3060761094093323, -0.18623924255371094, -0.06640267372131348, 0.053434163331985474, 0.17327100038528442, 0.2931078374385834, 0.4129446744918823, 0.5327814817428589, 0.6526183485984802, 0.7724552154541016, 0.8922920227050781, 1.0121288299560547, 1.1319656372070312, 1.2518025636672974, 1.371639370918274, 1.4914761781692505, 1.6113131046295166, 1.7311499118804932, 1.8509867191314697, 1.9708235263824463, 2.090660333633423, 2.2104971408843994, 2.330334186553955, 2.4501709938049316, 2.570007801055908, 2.6898446083068848, 2.8096814155578613, 2.929518222808838, 3.0493550300598145, 3.169191837310791, 3.2890286445617676, 3.408865451812744, 3.5287024974823, 3.6485393047332764, 3.768376111984253]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 3.0, 7.0, 9.0, 21.0, 32.0, 39.0, 64.0, 170.0, 263.0, 520.0, 1288.0, 4660.0, 27286.0, 464856.0, 3397993.0, 270234.0, 20425.0, 4023.0, 1270.0, 505.0, 247.0, 169.0, 68.0, 46.0, 30.0, 15.0, 11.0, 6.0, 3.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7236328125, -0.6981735229492188, -0.6727142333984375, -0.6472549438476562, -0.621795654296875, -0.5963363647460938, -0.5708770751953125, -0.5454177856445312, -0.51995849609375, -0.49449920654296875, -0.4690399169921875, -0.44358062744140625, -0.418121337890625, -0.39266204833984375, -0.3672027587890625, -0.34174346923828125, -0.3162841796875, -0.29082489013671875, -0.2653656005859375, -0.23990631103515625, -0.214447021484375, -0.18898773193359375, -0.1635284423828125, -0.13806915283203125, -0.11260986328125, -0.08715057373046875, -0.0616912841796875, -0.03623199462890625, -0.010772705078125, 0.01468658447265625, 0.0401458740234375, 0.06560516357421875, 0.091064453125, 0.11652374267578125, 0.1419830322265625, 0.16744232177734375, 0.192901611328125, 0.21836090087890625, 0.2438201904296875, 0.26927947998046875, 0.29473876953125, 0.32019805908203125, 0.3456573486328125, 0.37111663818359375, 0.396575927734375, 0.42203521728515625, 0.4474945068359375, 0.47295379638671875, 0.4984130859375, 0.5238723754882812, 0.5493316650390625, 0.5747909545898438, 0.600250244140625, 0.6257095336914062, 0.6511688232421875, 0.6766281127929688, 0.70208740234375, 0.7275466918945312, 0.7530059814453125, 0.7784652709960938, 0.803924560546875, 0.8293838500976562, 0.8548431396484375, 0.8803024291992188, 0.90576171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 10.0, 14.0, 12.0, 14.0, 25.0, 14.0, 33.0, 25.0, 36.0, 41.0, 38.0, 58.0, 51.0, 50.0, 64.0, 50.0, 52.0, 49.0, 51.0, 38.0, 39.0, 42.0, 29.0, 38.0, 18.0, 20.0, 14.0, 17.0, 12.0, 13.0, 6.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.354736328125, -0.34516143798828125, -0.3355865478515625, -0.32601165771484375, -0.316436767578125, -0.30686187744140625, -0.2972869873046875, -0.28771209716796875, -0.27813720703125, -0.26856231689453125, -0.2589874267578125, -0.24941253662109375, -0.239837646484375, -0.23026275634765625, -0.2206878662109375, -0.21111297607421875, -0.2015380859375, -0.19196319580078125, -0.1823883056640625, -0.17281341552734375, -0.163238525390625, -0.15366363525390625, -0.1440887451171875, -0.13451385498046875, -0.12493896484375, -0.11536407470703125, -0.1057891845703125, -0.09621429443359375, -0.086639404296875, -0.07706451416015625, -0.0674896240234375, -0.05791473388671875, -0.04833984375, -0.03876495361328125, -0.0291900634765625, -0.01961517333984375, -0.010040283203125, -0.00046539306640625, 0.0091094970703125, 0.01868438720703125, 0.02825927734375, 0.03783416748046875, 0.0474090576171875, 0.05698394775390625, 0.066558837890625, 0.07613372802734375, 0.0857086181640625, 0.09528350830078125, 0.1048583984375, 0.11443328857421875, 0.1240081787109375, 0.13358306884765625, 0.143157958984375, 0.15273284912109375, 0.1623077392578125, 0.17188262939453125, 0.18145751953125, 0.19103240966796875, 0.2006072998046875, 0.21018218994140625, 0.219757080078125, 0.22933197021484375, 0.2389068603515625, 0.24848175048828125, 0.258056640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 5.0, 8.0, 7.0, 14.0, 27.0, 19.0, 40.0, 62.0, 101.0, 260.0, 680.0, 2533.0, 16629.0, 340358.0, 3715270.0, 107181.0, 8685.0, 1505.0, 443.0, 192.0, 109.0, 45.0, 43.0, 20.0, 17.0, 16.0, 5.0, 6.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0244140625, -0.98828125, -0.9521484375, -0.916015625, -0.8798828125, -0.84375, -0.8076171875, -0.771484375, -0.7353515625, -0.69921875, -0.6630859375, -0.626953125, -0.5908203125, -0.5546875, -0.5185546875, -0.482421875, -0.4462890625, -0.41015625, -0.3740234375, -0.337890625, -0.3017578125, -0.265625, -0.2294921875, -0.193359375, -0.1572265625, -0.12109375, -0.0849609375, -0.048828125, -0.0126953125, 0.0234375, 0.0595703125, 0.095703125, 0.1318359375, 0.16796875, 0.2041015625, 0.240234375, 0.2763671875, 0.3125, 0.3486328125, 0.384765625, 0.4208984375, 0.45703125, 0.4931640625, 0.529296875, 0.5654296875, 0.6015625, 0.6376953125, 0.673828125, 0.7099609375, 0.74609375, 0.7822265625, 0.818359375, 0.8544921875, 0.890625, 0.9267578125, 0.962890625, 0.9990234375, 1.03515625, 1.0712890625, 1.107421875, 1.1435546875, 1.1796875, 1.2158203125, 1.251953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 11.0, 9.0, 21.0, 22.0, 22.0, 44.0, 53.0, 87.0, 123.0, 212.0, 364.0, 559.0, 681.0, 634.0, 461.0, 297.0, 156.0, 100.0, 72.0, 33.0, 33.0, 24.0, 11.0, 10.0, 9.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.642852783203125, -0.61968994140625, -0.596527099609375, -0.5733642578125, -0.550201416015625, -0.52703857421875, -0.503875732421875, -0.480712890625, -0.457550048828125, -0.43438720703125, -0.411224365234375, -0.3880615234375, -0.364898681640625, -0.34173583984375, -0.318572998046875, -0.29541015625, -0.272247314453125, -0.24908447265625, -0.225921630859375, -0.2027587890625, -0.179595947265625, -0.15643310546875, -0.133270263671875, -0.110107421875, -0.086944580078125, -0.06378173828125, -0.040618896484375, -0.0174560546875, 0.005706787109375, 0.02886962890625, 0.052032470703125, 0.0751953125, 0.098358154296875, 0.12152099609375, 0.144683837890625, 0.1678466796875, 0.191009521484375, 0.21417236328125, 0.237335205078125, 0.260498046875, 0.283660888671875, 0.30682373046875, 0.329986572265625, 0.3531494140625, 0.376312255859375, 0.39947509765625, 0.422637939453125, 0.44580078125, 0.468963623046875, 0.49212646484375, 0.515289306640625, 0.5384521484375, 0.561614990234375, 0.58477783203125, 0.607940673828125, 0.631103515625, 0.654266357421875, 0.67742919921875, 0.700592041015625, 0.7237548828125, 0.746917724609375, 0.77008056640625, 0.793243408203125, 0.81640625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 2.0, 5.0, 3.0, 11.0, 18.0, 24.0, 73.0, 124.0, 208.0, 187.0, 151.0, 102.0, 59.0, 20.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.71927261352539, -11.491153717041016, -11.263035774230957, -11.034916877746582, -10.806797981262207, -10.578680038452148, -10.350561141967773, -10.122442245483398, -9.894323348999023, -9.666204452514648, -9.43808650970459, -9.209967613220215, -8.98184871673584, -8.753730773925781, -8.525611877441406, -8.297492980957031, -8.069375038146973, -7.841256618499756, -7.613137722015381, -7.385019302368164, -7.156900405883789, -6.928781986236572, -6.7006635665893555, -6.4725446701049805, -6.244426250457764, -6.016307830810547, -5.788188934326172, -5.560070514678955, -5.331952095031738, -5.103833198547363, -4.8757147789001465, -4.64759635925293, -4.419477462768555, -4.191359043121338, -3.963240146636963, -3.735121726989746, -3.50700306892395, -3.2788844108581543, -3.0507659912109375, -2.8226473331451416, -2.5945284366607666, -2.3664097785949707, -2.138291358947754, -1.910172700881958, -1.682054042816162, -1.4539353847503662, -1.2258168458938599, -0.9976983070373535, -0.7695796489715576, -0.5414610505104065, -0.31334245204925537, -0.08522385358810425, 0.14289474487304688, 0.3710134029388428, 0.5991319417953491, 0.8272504806518555, 1.0553691387176514, 1.2834877967834473, 1.5116063356399536, 1.73972487449646, 1.9678435325622559, 2.1959621906280518, 2.4240808486938477, 2.6521992683410645, 2.8803179264068604]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 2.0, 8.0, 5.0, 8.0, 11.0, 9.0, 14.0, 21.0, 13.0, 18.0, 20.0, 24.0, 20.0, 28.0, 44.0, 30.0, 49.0, 33.0, 47.0, 38.0, 38.0, 42.0, 43.0, 37.0, 36.0, 31.0, 40.0, 27.0, 29.0, 35.0, 25.0, 23.0, 17.0, 17.0, 14.0, 15.0, 13.0, 16.0, 7.0, 9.0, 9.0, 5.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.3750357627868652, -2.2939507961273193, -2.2128658294677734, -2.1317811012268066, -2.0506961345672607, -1.9696111679077148, -1.888526201248169, -1.807441234588623, -1.7263563871383667, -1.6452714204788208, -1.5641865730285645, -1.4831016063690186, -1.4020166397094727, -1.3209317922592163, -1.2398468255996704, -1.158761978149414, -1.0776770114898682, -0.996592104434967, -0.9155071973800659, -0.83442223072052, -0.7533373236656189, -0.6722524166107178, -0.5911674499511719, -0.5100825428962708, -0.42899763584136963, -0.3479127287864685, -0.266827791929245, -0.18574286997318268, -0.10465794801712036, -0.02357304096221924, 0.05751189589500427, 0.13859683275222778, 0.2196817398071289, 0.30076664686203003, 0.38185158371925354, 0.46293652057647705, 0.5440214276313782, 0.6251063346862793, 0.7061913013458252, 0.7872762084007263, 0.8683611154556274, 0.9494460225105286, 1.0305309295654297, 1.1116158962249756, 1.1927008628845215, 1.2737857103347778, 1.3548706769943237, 1.43595552444458, 1.517040491104126, 1.5981254577636719, 1.6792103052139282, 1.7602952718734741, 1.8413801193237305, 1.9224650859832764, 2.0035500526428223, 2.084635019302368, 2.165719985961914, 2.24680495262146, 2.327889919281006, 2.4089746475219727, 2.4900596141815186, 2.5711445808410645, 2.6522295475006104, 2.7333145141601562, 2.814399242401123]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 5.0, 14.0, 26.0, 33.0, 41.0, 58.0, 110.0, 183.0, 325.0, 675.0, 1429.0, 3384.0, 8822.0, 24978.0, 76902.0, 241540.0, 409023.0, 188995.0, 59803.0, 19926.0, 7028.0, 2795.0, 1183.0, 537.0, 333.0, 151.0, 75.0, 63.0, 46.0, 17.0, 14.0, 16.0, 10.0, 3.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.6279296875, -0.6091232299804688, -0.5903167724609375, -0.5715103149414062, -0.552703857421875, -0.5338973999023438, -0.5150909423828125, -0.49628448486328125, -0.47747802734375, -0.45867156982421875, -0.4398651123046875, -0.42105865478515625, -0.402252197265625, -0.38344573974609375, -0.3646392822265625, -0.34583282470703125, -0.3270263671875, -0.30821990966796875, -0.2894134521484375, -0.27060699462890625, -0.251800537109375, -0.23299407958984375, -0.2141876220703125, -0.19538116455078125, -0.17657470703125, -0.15776824951171875, -0.1389617919921875, -0.12015533447265625, -0.101348876953125, -0.08254241943359375, -0.0637359619140625, -0.04492950439453125, -0.026123046875, -0.00731658935546875, 0.0114898681640625, 0.03029632568359375, 0.049102783203125, 0.06790924072265625, 0.0867156982421875, 0.10552215576171875, 0.12432861328125, 0.14313507080078125, 0.1619415283203125, 0.18074798583984375, 0.199554443359375, 0.21836090087890625, 0.2371673583984375, 0.25597381591796875, 0.2747802734375, 0.29358673095703125, 0.3123931884765625, 0.33119964599609375, 0.350006103515625, 0.36881256103515625, 0.3876190185546875, 0.40642547607421875, 0.42523193359375, 0.44403839111328125, 0.4628448486328125, 0.48165130615234375, 0.500457763671875, 0.5192642211914062, 0.5380706787109375, 0.5568771362304688, 0.57568359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 2.0, 6.0, 10.0, 19.0, 13.0, 17.0, 22.0, 25.0, 34.0, 33.0, 33.0, 41.0, 44.0, 53.0, 52.0, 53.0, 58.0, 58.0, 52.0, 53.0, 54.0, 36.0, 33.0, 34.0, 30.0, 23.0, 18.0, 18.0, 14.0, 17.0, 10.0, 9.0, 3.0, 8.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.361572265625, -0.3513336181640625, -0.341094970703125, -0.3308563232421875, -0.32061767578125, -0.3103790283203125, -0.300140380859375, -0.2899017333984375, -0.2796630859375, -0.2694244384765625, -0.259185791015625, -0.2489471435546875, -0.23870849609375, -0.2284698486328125, -0.218231201171875, -0.2079925537109375, -0.19775390625, -0.1875152587890625, -0.177276611328125, -0.1670379638671875, -0.15679931640625, -0.1465606689453125, -0.136322021484375, -0.1260833740234375, -0.1158447265625, -0.1056060791015625, -0.095367431640625, -0.0851287841796875, -0.07489013671875, -0.0646514892578125, -0.054412841796875, -0.0441741943359375, -0.033935546875, -0.0236968994140625, -0.013458251953125, -0.0032196044921875, 0.00701904296875, 0.0172576904296875, 0.027496337890625, 0.0377349853515625, 0.0479736328125, 0.0582122802734375, 0.068450927734375, 0.0786895751953125, 0.08892822265625, 0.0991668701171875, 0.109405517578125, 0.1196441650390625, 0.1298828125, 0.1401214599609375, 0.150360107421875, 0.1605987548828125, 0.17083740234375, 0.1810760498046875, 0.191314697265625, 0.2015533447265625, 0.2117919921875, 0.2220306396484375, 0.232269287109375, 0.2425079345703125, 0.25274658203125, 0.2629852294921875, 0.273223876953125, 0.2834625244140625, 0.293701171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 13.0, 18.0, 29.0, 49.0, 66.0, 112.0, 151.0, 292.0, 472.0, 972.0, 2669.0, 13201.0, 129919.0, 791153.0, 94442.0, 10557.0, 2349.0, 852.0, 454.0, 282.0, 181.0, 111.0, 79.0, 44.0, 29.0, 18.0, 10.0, 9.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98291015625, -0.9457321166992188, -0.9085540771484375, -0.8713760375976562, -0.834197998046875, -0.7970199584960938, -0.7598419189453125, -0.7226638793945312, -0.68548583984375, -0.6483078002929688, -0.6111297607421875, -0.5739517211914062, -0.536773681640625, -0.49959564208984375, -0.4624176025390625, -0.42523956298828125, -0.3880615234375, -0.35088348388671875, -0.3137054443359375, -0.27652740478515625, -0.239349365234375, -0.20217132568359375, -0.1649932861328125, -0.12781524658203125, -0.09063720703125, -0.05345916748046875, -0.0162811279296875, 0.02089691162109375, 0.058074951171875, 0.09525299072265625, 0.1324310302734375, 0.16960906982421875, 0.206787109375, 0.24396514892578125, 0.2811431884765625, 0.31832122802734375, 0.355499267578125, 0.39267730712890625, 0.4298553466796875, 0.46703338623046875, 0.50421142578125, 0.5413894653320312, 0.5785675048828125, 0.6157455444335938, 0.652923583984375, 0.6901016235351562, 0.7272796630859375, 0.7644577026367188, 0.8016357421875, 0.8388137817382812, 0.8759918212890625, 0.9131698608398438, 0.950347900390625, 0.9875259399414062, 1.0247039794921875, 1.0618820190429688, 1.09906005859375, 1.1362380981445312, 1.1734161376953125, 1.2105941772460938, 1.247772216796875, 1.2849502563476562, 1.3221282958984375, 1.3593063354492188, 1.396484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 5.0, 3.0, 9.0, 13.0, 10.0, 15.0, 23.0, 21.0, 30.0, 42.0, 55.0, 56.0, 52.0, 53.0, 50.0, 64.0, 70.0, 68.0, 53.0, 34.0, 50.0, 42.0, 29.0, 29.0, 19.0, 15.0, 19.0, 13.0, 12.0, 12.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4384765625, -1.4010162353515625, -1.363555908203125, -1.3260955810546875, -1.28863525390625, -1.2511749267578125, -1.213714599609375, -1.1762542724609375, -1.1387939453125, -1.1013336181640625, -1.063873291015625, -1.0264129638671875, -0.98895263671875, -0.9514923095703125, -0.914031982421875, -0.8765716552734375, -0.839111328125, -0.8016510009765625, -0.764190673828125, -0.7267303466796875, -0.68927001953125, -0.6518096923828125, -0.614349365234375, -0.5768890380859375, -0.5394287109375, -0.5019683837890625, -0.464508056640625, -0.4270477294921875, -0.38958740234375, -0.3521270751953125, -0.314666748046875, -0.2772064208984375, -0.23974609375, -0.2022857666015625, -0.164825439453125, -0.1273651123046875, -0.08990478515625, -0.0524444580078125, -0.014984130859375, 0.0224761962890625, 0.0599365234375, 0.0973968505859375, 0.134857177734375, 0.1723175048828125, 0.20977783203125, 0.2472381591796875, 0.284698486328125, 0.3221588134765625, 0.359619140625, 0.3970794677734375, 0.434539794921875, 0.4720001220703125, 0.50946044921875, 0.5469207763671875, 0.584381103515625, 0.6218414306640625, 0.6593017578125, 0.6967620849609375, 0.734222412109375, 0.7716827392578125, 0.80914306640625, 0.8466033935546875, 0.884063720703125, 0.9215240478515625, 0.958984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 3.0, 8.0, 12.0, 15.0, 18.0, 36.0, 71.0, 113.0, 193.0, 334.0, 648.0, 1411.0, 3080.0, 7769.0, 22140.0, 73021.0, 521404.0, 315494.0, 68660.0, 21082.0, 7400.0, 2969.0, 1237.0, 624.0, 315.0, 185.0, 103.0, 73.0, 39.0, 25.0, 20.0, 10.0, 4.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.241455078125, -0.2339038848876953, -0.22635269165039062, -0.21880149841308594, -0.21125030517578125, -0.20369911193847656, -0.19614791870117188, -0.1885967254638672, -0.1810455322265625, -0.1734943389892578, -0.16594314575195312, -0.15839195251464844, -0.15084075927734375, -0.14328956604003906, -0.13573837280273438, -0.1281871795654297, -0.120635986328125, -0.11308479309082031, -0.10553359985351562, -0.09798240661621094, -0.09043121337890625, -0.08288002014160156, -0.07532882690429688, -0.06777763366699219, -0.0602264404296875, -0.05267524719238281, -0.045124053955078125, -0.03757286071777344, -0.03002166748046875, -0.022470474243164062, -0.014919281005859375, -0.0073680877685546875, 0.00018310546875, 0.0077342987060546875, 0.015285491943359375, 0.022836685180664062, 0.03038787841796875, 0.03793907165527344, 0.045490264892578125, 0.05304145812988281, 0.0605926513671875, 0.06814384460449219, 0.07569503784179688, 0.08324623107910156, 0.09079742431640625, 0.09834861755371094, 0.10589981079101562, 0.11345100402832031, 0.121002197265625, 0.1285533905029297, 0.13610458374023438, 0.14365577697753906, 0.15120697021484375, 0.15875816345214844, 0.16630935668945312, 0.1738605499267578, 0.1814117431640625, 0.1889629364013672, 0.19651412963867188, 0.20406532287597656, 0.21161651611328125, 0.21916770935058594, 0.22671890258789062, 0.2342700958251953, 0.2418212890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 3.0, 3.0, 8.0, 14.0, 27.0, 34.0, 28.0, 61.0, 67.0, 131.0, 128.0, 117.0, 93.0, 72.0, 62.0, 26.0, 35.0, 26.0, 15.0, 9.0, 11.0, 5.0, 2.0, 5.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011235475540161133, -0.00010947417467832565, -0.00010659359395503998, -0.0001037130132317543, -0.00010083243250846863, -9.795185178518295e-05, -9.507127106189728e-05, -9.21906903386116e-05, -8.931010961532593e-05, -8.642952889204025e-05, -8.354894816875458e-05, -8.06683674454689e-05, -7.778778672218323e-05, -7.490720599889755e-05, -7.202662527561188e-05, -6.91460445523262e-05, -6.626546382904053e-05, -6.338488310575485e-05, -6.050430238246918e-05, -5.76237216591835e-05, -5.474314093589783e-05, -5.186256021261215e-05, -4.898197948932648e-05, -4.61013987660408e-05, -4.322081804275513e-05, -4.034023731946945e-05, -3.745965659618378e-05, -3.45790758728981e-05, -3.169849514961243e-05, -2.8817914426326752e-05, -2.5937333703041077e-05, -2.30567529797554e-05, -2.0176172256469727e-05, -1.729559153318405e-05, -1.4415010809898376e-05, -1.1534430086612701e-05, -8.653849363327026e-06, -5.773268640041351e-06, -2.8926879167556763e-06, -1.210719347000122e-08, 2.868473529815674e-06, 5.749054253101349e-06, 8.629634976387024e-06, 1.1510215699672699e-05, 1.4390796422958374e-05, 1.727137714624405e-05, 2.0151957869529724e-05, 2.30325385928154e-05, 2.5913119316101074e-05, 2.879370003938675e-05, 3.1674280762672424e-05, 3.45548614859581e-05, 3.7435442209243774e-05, 4.031602293252945e-05, 4.3196603655815125e-05, 4.60771843791008e-05, 4.8957765102386475e-05, 5.183834582567215e-05, 5.4718926548957825e-05, 5.75995072722435e-05, 6.0480087995529175e-05, 6.336066871881485e-05, 6.624124944210052e-05, 6.91218301653862e-05, 7.200241088867188e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 8.0, 15.0, 23.0, 17.0, 28.0, 54.0, 60.0, 107.0, 156.0, 255.0, 420.0, 749.0, 1487.0, 3322.0, 8438.0, 23998.0, 79742.0, 544925.0, 284143.0, 66698.0, 20406.0, 7379.0, 2941.0, 1341.0, 721.0, 425.0, 245.0, 141.0, 108.0, 61.0, 39.0, 26.0, 25.0, 12.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.27197265625, -0.26460838317871094, -0.2572441101074219, -0.2498798370361328, -0.24251556396484375, -0.2351512908935547, -0.22778701782226562, -0.22042274475097656, -0.2130584716796875, -0.20569419860839844, -0.19832992553710938, -0.1909656524658203, -0.18360137939453125, -0.1762371063232422, -0.16887283325195312, -0.16150856018066406, -0.154144287109375, -0.14678001403808594, -0.13941574096679688, -0.1320514678955078, -0.12468719482421875, -0.11732292175292969, -0.10995864868164062, -0.10259437561035156, -0.0952301025390625, -0.08786582946777344, -0.08050155639648438, -0.07313728332519531, -0.06577301025390625, -0.05840873718261719, -0.051044464111328125, -0.04368019104003906, -0.03631591796875, -0.028951644897460938, -0.021587371826171875, -0.014223098754882812, -0.00685882568359375, 0.0005054473876953125, 0.007869720458984375, 0.015233993530273438, 0.0225982666015625, 0.029962539672851562, 0.037326812744140625, 0.04469108581542969, 0.05205535888671875, 0.05941963195800781, 0.06678390502929688, 0.07414817810058594, 0.081512451171875, 0.08887672424316406, 0.09624099731445312, 0.10360527038574219, 0.11096954345703125, 0.11833381652832031, 0.12569808959960938, 0.13306236267089844, 0.1404266357421875, 0.14779090881347656, 0.15515518188476562, 0.1625194549560547, 0.16988372802734375, 0.1772480010986328, 0.18461227416992188, 0.19197654724121094, 0.1993408203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 1.0, 4.0, 6.0, 4.0, 6.0, 6.0, 6.0, 13.0, 18.0, 16.0, 24.0, 40.0, 45.0, 54.0, 71.0, 96.0, 103.0, 96.0, 80.0, 67.0, 66.0, 39.0, 46.0, 23.0, 17.0, 10.0, 13.0, 8.0, 7.0, 10.0, 0.0, 5.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3251953125, -0.3161773681640625, -0.307159423828125, -0.2981414794921875, -0.28912353515625, -0.2801055908203125, -0.271087646484375, -0.2620697021484375, -0.2530517578125, -0.2440338134765625, -0.235015869140625, -0.2259979248046875, -0.21697998046875, -0.2079620361328125, -0.198944091796875, -0.1899261474609375, -0.180908203125, -0.1718902587890625, -0.162872314453125, -0.1538543701171875, -0.14483642578125, -0.1358184814453125, -0.126800537109375, -0.1177825927734375, -0.1087646484375, -0.0997467041015625, -0.090728759765625, -0.0817108154296875, -0.07269287109375, -0.0636749267578125, -0.054656982421875, -0.0456390380859375, -0.03662109375, -0.0276031494140625, -0.018585205078125, -0.0095672607421875, -0.00054931640625, 0.0084686279296875, 0.017486572265625, 0.0265045166015625, 0.0355224609375, 0.0445404052734375, 0.053558349609375, 0.0625762939453125, 0.07159423828125, 0.0806121826171875, 0.089630126953125, 0.0986480712890625, 0.107666015625, 0.1166839599609375, 0.125701904296875, 0.1347198486328125, 0.14373779296875, 0.1527557373046875, 0.161773681640625, 0.1707916259765625, 0.1798095703125, 0.1888275146484375, 0.197845458984375, 0.2068634033203125, 0.21588134765625, 0.2248992919921875, 0.233917236328125, 0.2429351806640625, 0.251953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 1.0, 9.0, 24.0, 34.0, 82.0, 148.0, 302.0, 211.0, 90.0, 41.0, 25.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.440393447875977, -6.190920829772949, -5.941448211669922, -5.6919755935668945, -5.442502975463867, -5.19303035736084, -4.9435577392578125, -4.694085121154785, -4.444612503051758, -4.1951398849487305, -3.945667266845703, -3.696194648742676, -3.4467220306396484, -3.197249412536621, -2.9477767944335938, -2.6983041763305664, -2.448831558227539, -2.1993589401245117, -1.9498863220214844, -1.700413703918457, -1.4509410858154297, -1.2014684677124023, -0.951995849609375, -0.7025232315063477, -0.4530506134033203, -0.20357799530029297, 0.045894622802734375, 0.2953672409057617, 0.5448398590087891, 0.7943124771118164, 1.0437850952148438, 1.293257713317871, 1.5427303314208984, 1.7922029495239258, 2.041675567626953, 2.2911481857299805, 2.540620803833008, 2.790093421936035, 3.0395660400390625, 3.28903865814209, 3.538511276245117, 3.7879838943481445, 4.037456512451172, 4.286929130554199, 4.536401748657227, 4.785874366760254, 5.035346984863281, 5.284819602966309, 5.534292221069336, 5.783764839172363, 6.033237457275391, 6.282710075378418, 6.532182693481445, 6.781655311584473, 7.0311279296875, 7.280600547790527, 7.530073165893555, 7.779545783996582, 8.02901840209961, 8.278491020202637, 8.527963638305664, 8.777436256408691, 9.026908874511719, 9.276381492614746, 9.525854110717773]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 5.0, 6.0, 11.0, 11.0, 13.0, 18.0, 22.0, 23.0, 22.0, 23.0, 21.0, 19.0, 39.0, 52.0, 87.0, 95.0, 124.0, 66.0, 43.0, 34.0, 32.0, 31.0, 22.0, 23.0, 25.0, 22.0, 14.0, 21.0, 11.0, 12.0, 7.0, 12.0, 7.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.863215923309326, -3.7298285961151123, -3.5964412689208984, -3.4630539417266846, -3.3296666145324707, -3.1962790489196777, -3.062891721725464, -2.92950439453125, -2.796117067337036, -2.6627297401428223, -2.5293424129486084, -2.3959550857543945, -2.2625675201416016, -2.129180431365967, -1.9957928657531738, -1.86240553855896, -1.729018211364746, -1.5956308841705322, -1.4622435569763184, -1.328856110572815, -1.195468783378601, -1.0620814561843872, -0.9286940693855286, -0.7953066825866699, -0.661919355392456, -0.5285320281982422, -0.39514464139938354, -0.2617572844028473, -0.12836992740631104, 0.005017399787902832, 0.13840478658676147, 0.2717921733856201, 0.4051799774169922, 0.538567304611206, 0.6719546914100647, 0.8053420782089233, 0.9387294054031372, 1.072116732597351, 1.2055041790008545, 1.3388915061950684, 1.4722788333892822, 1.605666160583496, 1.73905348777771, 1.8724409341812134, 2.005828380584717, 2.1392154693603516, 2.2726030349731445, 2.4059903621673584, 2.5393776893615723, 2.672765016555786, 2.80615234375, 2.939539670944214, 3.0729269981384277, 3.2063145637512207, 3.3397018909454346, 3.4730892181396484, 3.6064765453338623, 3.739863872528076, 3.87325119972229, 4.006638526916504, 4.140026092529297, 4.273413181304932, 4.406800746917725, 4.540187835693359, 4.673575401306152]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 10.0, 8.0, 5.0, 16.0, 17.0, 15.0, 43.0, 47.0, 75.0, 99.0, 120.0, 221.0, 393.0, 701.0, 1649.0, 4536.0, 20237.0, 186845.0, 2503499.0, 1370087.0, 86796.0, 12657.0, 3371.0, 1311.0, 585.0, 279.0, 194.0, 118.0, 78.0, 70.0, 54.0, 32.0, 35.0, 19.0, 14.0, 14.0, 4.0, 8.0, 8.0, 2.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69482421875, -0.67230224609375, -0.6497802734375, -0.62725830078125, -0.604736328125, -0.58221435546875, -0.5596923828125, -0.53717041015625, -0.5146484375, -0.49212646484375, -0.4696044921875, -0.44708251953125, -0.424560546875, -0.40203857421875, -0.3795166015625, -0.35699462890625, -0.33447265625, -0.31195068359375, -0.2894287109375, -0.26690673828125, -0.244384765625, -0.22186279296875, -0.1993408203125, -0.17681884765625, -0.154296875, -0.13177490234375, -0.1092529296875, -0.08673095703125, -0.064208984375, -0.04168701171875, -0.0191650390625, 0.00335693359375, 0.02587890625, 0.04840087890625, 0.0709228515625, 0.09344482421875, 0.115966796875, 0.13848876953125, 0.1610107421875, 0.18353271484375, 0.2060546875, 0.22857666015625, 0.2510986328125, 0.27362060546875, 0.296142578125, 0.31866455078125, 0.3411865234375, 0.36370849609375, 0.38623046875, 0.40875244140625, 0.4312744140625, 0.45379638671875, 0.476318359375, 0.49884033203125, 0.5213623046875, 0.54388427734375, 0.56640625, 0.58892822265625, 0.6114501953125, 0.63397216796875, 0.656494140625, 0.67901611328125, 0.7015380859375, 0.72406005859375, 0.74658203125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 8.0, 17.0, 23.0, 15.0, 22.0, 34.0, 30.0, 43.0, 35.0, 46.0, 61.0, 60.0, 52.0, 77.0, 57.0, 68.0, 41.0, 46.0, 33.0, 37.0, 31.0, 35.0, 28.0, 23.0, 20.0, 10.0, 7.0, 5.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37158203125, -0.36011505126953125, -0.3486480712890625, -0.33718109130859375, -0.325714111328125, -0.31424713134765625, -0.3027801513671875, -0.29131317138671875, -0.27984619140625, -0.26837921142578125, -0.2569122314453125, -0.24544525146484375, -0.233978271484375, -0.22251129150390625, -0.2110443115234375, -0.19957733154296875, -0.1881103515625, -0.17664337158203125, -0.1651763916015625, -0.15370941162109375, -0.142242431640625, -0.13077545166015625, -0.1193084716796875, -0.10784149169921875, -0.09637451171875, -0.08490753173828125, -0.0734405517578125, -0.06197357177734375, -0.050506591796875, -0.03903961181640625, -0.0275726318359375, -0.01610565185546875, -0.004638671875, 0.00682830810546875, 0.0182952880859375, 0.02976226806640625, 0.041229248046875, 0.05269622802734375, 0.0641632080078125, 0.07563018798828125, 0.08709716796875, 0.09856414794921875, 0.1100311279296875, 0.12149810791015625, 0.132965087890625, 0.14443206787109375, 0.1558990478515625, 0.16736602783203125, 0.1788330078125, 0.19029998779296875, 0.2017669677734375, 0.21323394775390625, 0.224700927734375, 0.23616790771484375, 0.2476348876953125, 0.25910186767578125, 0.27056884765625, 0.28203582763671875, 0.2935028076171875, 0.30496978759765625, 0.316436767578125, 0.32790374755859375, 0.3393707275390625, 0.35083770751953125, 0.3623046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 5.0, 18.0, 12.0, 35.0, 39.0, 98.0, 185.0, 362.0, 952.0, 4239.0, 59308.0, 3882484.0, 236301.0, 8056.0, 1333.0, 435.0, 190.0, 101.0, 49.0, 23.0, 16.0, 14.0, 7.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.373046875, -1.32513427734375, -1.2772216796875, -1.22930908203125, -1.181396484375, -1.13348388671875, -1.0855712890625, -1.03765869140625, -0.98974609375, -0.94183349609375, -0.8939208984375, -0.84600830078125, -0.798095703125, -0.75018310546875, -0.7022705078125, -0.65435791015625, -0.6064453125, -0.55853271484375, -0.5106201171875, -0.46270751953125, -0.414794921875, -0.36688232421875, -0.3189697265625, -0.27105712890625, -0.22314453125, -0.17523193359375, -0.1273193359375, -0.07940673828125, -0.031494140625, 0.01641845703125, 0.0643310546875, 0.11224365234375, 0.16015625, 0.20806884765625, 0.2559814453125, 0.30389404296875, 0.351806640625, 0.39971923828125, 0.4476318359375, 0.49554443359375, 0.54345703125, 0.59136962890625, 0.6392822265625, 0.68719482421875, 0.735107421875, 0.78302001953125, 0.8309326171875, 0.87884521484375, 0.9267578125, 0.97467041015625, 1.0225830078125, 1.07049560546875, 1.118408203125, 1.16632080078125, 1.2142333984375, 1.26214599609375, 1.31005859375, 1.35797119140625, 1.4058837890625, 1.45379638671875, 1.501708984375, 1.54962158203125, 1.5975341796875, 1.64544677734375, 1.693359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 6.0, 6.0, 13.0, 16.0, 27.0, 42.0, 70.0, 144.0, 259.0, 490.0, 798.0, 920.0, 620.0, 303.0, 158.0, 84.0, 52.0, 22.0, 15.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.5557022094726562, -1.5196075439453125, -1.4835128784179688, -1.447418212890625, -1.4113235473632812, -1.3752288818359375, -1.3391342163085938, -1.30303955078125, -1.2669448852539062, -1.2308502197265625, -1.1947555541992188, -1.158660888671875, -1.1225662231445312, -1.0864715576171875, -1.0503768920898438, -1.0142822265625, -0.9781875610351562, -0.9420928955078125, -0.9059982299804688, -0.869903564453125, -0.8338088989257812, -0.7977142333984375, -0.7616195678710938, -0.72552490234375, -0.6894302368164062, -0.6533355712890625, -0.6172409057617188, -0.581146240234375, -0.5450515747070312, -0.5089569091796875, -0.47286224365234375, -0.436767578125, -0.40067291259765625, -0.3645782470703125, -0.32848358154296875, -0.292388916015625, -0.25629425048828125, -0.2201995849609375, -0.18410491943359375, -0.14801025390625, -0.11191558837890625, -0.0758209228515625, -0.03972625732421875, -0.003631591796875, 0.03246307373046875, 0.0685577392578125, 0.10465240478515625, 0.1407470703125, 0.17684173583984375, 0.2129364013671875, 0.24903106689453125, 0.285125732421875, 0.32122039794921875, 0.3573150634765625, 0.39340972900390625, 0.42950439453125, 0.46559906005859375, 0.5016937255859375, 0.5377883911132812, 0.573883056640625, 0.6099777221679688, 0.6460723876953125, 0.6821670532226562, 0.71826171875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 13.0, 7.0, 24.0, 33.0, 59.0, 91.0, 133.0, 163.0, 166.0, 124.0, 81.0, 48.0, 21.0, 12.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.421880722045898, -10.205196380615234, -9.988511085510254, -9.77182674407959, -9.55514144897461, -9.338457107543945, -9.121771812438965, -8.9050874710083, -8.68840217590332, -8.471717834472656, -8.255032539367676, -8.038348197937012, -7.821662902832031, -7.604978084564209, -7.388293266296387, -7.1716084480285645, -6.954923629760742, -6.73823881149292, -6.521553993225098, -6.304869174957275, -6.088184356689453, -5.871499538421631, -5.654814720153809, -5.438129901885986, -5.221445560455322, -5.0047607421875, -4.788075923919678, -4.5713911056518555, -4.354706287384033, -4.138021469116211, -3.9213366508483887, -3.7046518325805664, -3.487967014312744, -3.271282196044922, -3.0545973777770996, -2.8379125595092773, -2.621227741241455, -2.404542922973633, -2.1878581047058105, -1.9711734056472778, -1.7544885873794556, -1.5378037691116333, -1.321118950843811, -1.1044342517852783, -0.8877493739128113, -0.6710646152496338, -0.4543797969818115, -0.23769497871398926, -0.021010160446166992, 0.19567464292049408, 0.41235944628715515, 0.629044234752655, 0.8457290530204773, 1.0624138116836548, 1.279098629951477, 1.4957834482192993, 1.7124682664871216, 1.9291530847549438, 2.1458377838134766, 2.362522602081299, 2.579207420349121, 2.7958922386169434, 3.0125770568847656, 3.229261875152588, 3.44594669342041]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 14.0, 17.0, 14.0, 12.0, 21.0, 24.0, 27.0, 31.0, 31.0, 30.0, 38.0, 49.0, 43.0, 55.0, 30.0, 44.0, 50.0, 45.0, 48.0, 49.0, 44.0, 31.0, 27.0, 28.0, 25.0, 27.0, 20.0, 16.0, 16.0, 13.0, 10.0, 13.0, 8.0, 7.0, 12.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2860822677612305, -3.170498847961426, -3.054915189743042, -2.9393317699432373, -2.8237481117248535, -2.708164691925049, -2.592581033706665, -2.4769976139068604, -2.3614139556884766, -2.245830535888672, -2.130246877670288, -2.0146634578704834, -1.8990797996520996, -1.783496379852295, -1.6679127216339111, -1.5523293018341064, -1.4367457628250122, -1.321162223815918, -1.2055786848068237, -1.0899951457977295, -0.9744116067886353, -0.8588281273841858, -0.7432445883750916, -0.6276610493659973, -0.5120775103569031, -0.39649397134780884, -0.2809104323387146, -0.16532692313194275, -0.04974338412284851, 0.06584012508392334, 0.18142366409301758, 0.2970072031021118, 0.41259074211120605, 0.5281742811203003, 0.6437578201293945, 0.7593413591384888, 0.874924898147583, 0.9905083775520325, 1.1060919761657715, 1.2216753959655762, 1.33725905418396, 1.4528425931930542, 1.5684261322021484, 1.6840096712112427, 1.799593210220337, 1.9151766300201416, 2.0307602882385254, 2.14634370803833, 2.2619271278381348, 2.3775105476379395, 2.4930942058563232, 2.608677625656128, 2.7242612838745117, 2.8398447036743164, 2.9554283618927, 3.071011781692505, 3.1865954399108887, 3.3021788597106934, 3.417762517929077, 3.533345937728882, 3.6489295959472656, 3.7645130157470703, 3.880096673965454, 3.995680093765259, 4.111263751983643]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 12.0, 9.0, 29.0, 33.0, 61.0, 88.0, 147.0, 235.0, 425.0, 724.0, 1229.0, 2125.0, 3859.0, 7358.0, 14876.0, 31952.0, 75326.0, 188256.0, 350697.0, 215737.0, 85345.0, 35673.0, 16345.0, 8180.0, 4284.0, 2364.0, 1308.0, 747.0, 440.0, 243.0, 151.0, 97.0, 85.0, 39.0, 25.0, 16.0, 8.0, 7.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.5830078125, -0.5670661926269531, -0.5511245727539062, -0.5351829528808594, -0.5192413330078125, -0.5032997131347656, -0.48735809326171875, -0.4714164733886719, -0.455474853515625, -0.4395332336425781, -0.42359161376953125, -0.4076499938964844, -0.3917083740234375, -0.3757667541503906, -0.35982513427734375, -0.3438835144042969, -0.32794189453125, -0.3120002746582031, -0.29605865478515625, -0.2801170349121094, -0.2641754150390625, -0.24823379516601562, -0.23229217529296875, -0.21635055541992188, -0.200408935546875, -0.18446731567382812, -0.16852569580078125, -0.15258407592773438, -0.1366424560546875, -0.12070083618164062, -0.10475921630859375, -0.08881759643554688, -0.0728759765625, -0.056934356689453125, -0.04099273681640625, -0.025051116943359375, -0.0091094970703125, 0.006832122802734375, 0.02277374267578125, 0.038715362548828125, 0.054656982421875, 0.07059860229492188, 0.08654022216796875, 0.10248184204101562, 0.1184234619140625, 0.13436508178710938, 0.15030670166015625, 0.16624832153320312, 0.18218994140625, 0.19813156127929688, 0.21407318115234375, 0.23001480102539062, 0.2459564208984375, 0.2618980407714844, 0.27783966064453125, 0.2937812805175781, 0.309722900390625, 0.3256645202636719, 0.34160614013671875, 0.3575477600097656, 0.3734893798828125, 0.3894309997558594, 0.40537261962890625, 0.4213142395019531, 0.437255859375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 4.0, 9.0, 7.0, 11.0, 9.0, 11.0, 18.0, 28.0, 41.0, 26.0, 42.0, 33.0, 51.0, 42.0, 43.0, 57.0, 55.0, 76.0, 65.0, 50.0, 41.0, 39.0, 38.0, 34.0, 28.0, 33.0, 24.0, 11.0, 14.0, 13.0, 7.0, 14.0, 9.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3620338439941406, -0.35028839111328125, -0.3385429382324219, -0.3267974853515625, -0.3150520324707031, -0.30330657958984375, -0.2915611267089844, -0.279815673828125, -0.2680702209472656, -0.25632476806640625, -0.24457931518554688, -0.2328338623046875, -0.22108840942382812, -0.20934295654296875, -0.19759750366210938, -0.18585205078125, -0.17410659790039062, -0.16236114501953125, -0.15061569213867188, -0.1388702392578125, -0.12712478637695312, -0.11537933349609375, -0.10363388061523438, -0.091888427734375, -0.08014297485351562, -0.06839752197265625, -0.056652069091796875, -0.0449066162109375, -0.033161163330078125, -0.02141571044921875, -0.009670257568359375, 0.0020751953125, 0.013820648193359375, 0.02556610107421875, 0.037311553955078125, 0.0490570068359375, 0.060802459716796875, 0.07254791259765625, 0.08429336547851562, 0.096038818359375, 0.10778427124023438, 0.11952972412109375, 0.13127517700195312, 0.1430206298828125, 0.15476608276367188, 0.16651153564453125, 0.17825698852539062, 0.19000244140625, 0.20174789428710938, 0.21349334716796875, 0.22523880004882812, 0.2369842529296875, 0.24872970581054688, 0.26047515869140625, 0.2722206115722656, 0.283966064453125, 0.2957115173339844, 0.30745697021484375, 0.3192024230957031, 0.3309478759765625, 0.3426933288574219, 0.35443878173828125, 0.3661842346191406, 0.3779296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 6.0, 4.0, 5.0, 14.0, 13.0, 16.0, 25.0, 32.0, 41.0, 55.0, 83.0, 107.0, 148.0, 216.0, 287.0, 471.0, 765.0, 1352.0, 3118.0, 12097.0, 106648.0, 822981.0, 83297.0, 10430.0, 2788.0, 1300.0, 747.0, 455.0, 277.0, 210.0, 132.0, 119.0, 73.0, 55.0, 44.0, 30.0, 29.0, 24.0, 9.0, 12.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.123046875, -1.0849151611328125, -1.046783447265625, -1.0086517333984375, -0.97052001953125, -0.9323883056640625, -0.894256591796875, -0.8561248779296875, -0.8179931640625, -0.7798614501953125, -0.741729736328125, -0.7035980224609375, -0.66546630859375, -0.6273345947265625, -0.589202880859375, -0.5510711669921875, -0.512939453125, -0.4748077392578125, -0.436676025390625, -0.3985443115234375, -0.36041259765625, -0.3222808837890625, -0.284149169921875, -0.2460174560546875, -0.2078857421875, -0.1697540283203125, -0.131622314453125, -0.0934906005859375, -0.05535888671875, -0.0172271728515625, 0.020904541015625, 0.0590362548828125, 0.09716796875, 0.1352996826171875, 0.173431396484375, 0.2115631103515625, 0.24969482421875, 0.2878265380859375, 0.325958251953125, 0.3640899658203125, 0.4022216796875, 0.4403533935546875, 0.478485107421875, 0.5166168212890625, 0.55474853515625, 0.5928802490234375, 0.631011962890625, 0.6691436767578125, 0.707275390625, 0.7454071044921875, 0.783538818359375, 0.8216705322265625, 0.85980224609375, 0.8979339599609375, 0.936065673828125, 0.9741973876953125, 1.0123291015625, 1.0504608154296875, 1.088592529296875, 1.1267242431640625, 1.16485595703125, 1.2029876708984375, 1.241119384765625, 1.2792510986328125, 1.3173828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 5.0, 7.0, 8.0, 20.0, 15.0, 17.0, 17.0, 22.0, 30.0, 29.0, 41.0, 33.0, 44.0, 68.0, 75.0, 72.0, 65.0, 53.0, 54.0, 46.0, 47.0, 38.0, 42.0, 25.0, 26.0, 15.0, 14.0, 16.0, 8.0, 5.0, 5.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5498046875, -1.5025177001953125, -1.455230712890625, -1.4079437255859375, -1.36065673828125, -1.3133697509765625, -1.266082763671875, -1.2187957763671875, -1.1715087890625, -1.1242218017578125, -1.076934814453125, -1.0296478271484375, -0.98236083984375, -0.9350738525390625, -0.887786865234375, -0.8404998779296875, -0.793212890625, -0.7459259033203125, -0.698638916015625, -0.6513519287109375, -0.60406494140625, -0.5567779541015625, -0.509490966796875, -0.4622039794921875, -0.4149169921875, -0.3676300048828125, -0.320343017578125, -0.2730560302734375, -0.22576904296875, -0.1784820556640625, -0.131195068359375, -0.0839080810546875, -0.03662109375, 0.0106658935546875, 0.057952880859375, 0.1052398681640625, 0.15252685546875, 0.1998138427734375, 0.247100830078125, 0.2943878173828125, 0.3416748046875, 0.3889617919921875, 0.436248779296875, 0.4835357666015625, 0.53082275390625, 0.5781097412109375, 0.625396728515625, 0.6726837158203125, 0.719970703125, 0.7672576904296875, 0.814544677734375, 0.8618316650390625, 0.90911865234375, 0.9564056396484375, 1.003692626953125, 1.0509796142578125, 1.0982666015625, 1.1455535888671875, 1.192840576171875, 1.2401275634765625, 1.28741455078125, 1.3347015380859375, 1.381988525390625, 1.4292755126953125, 1.4765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 11.0, 16.0, 16.0, 22.0, 38.0, 58.0, 95.0, 185.0, 443.0, 1019.0, 3183.0, 13945.0, 104359.0, 826193.0, 82502.0, 11945.0, 2707.0, 931.0, 351.0, 194.0, 117.0, 80.0, 48.0, 22.0, 19.0, 18.0, 13.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.346435546875, -0.3360786437988281, -0.32572174072265625, -0.3153648376464844, -0.3050079345703125, -0.2946510314941406, -0.28429412841796875, -0.2739372253417969, -0.263580322265625, -0.2532234191894531, -0.24286651611328125, -0.23250961303710938, -0.2221527099609375, -0.21179580688476562, -0.20143890380859375, -0.19108200073242188, -0.18072509765625, -0.17036819458007812, -0.16001129150390625, -0.14965438842773438, -0.1392974853515625, -0.12894058227539062, -0.11858367919921875, -0.10822677612304688, -0.097869873046875, -0.08751296997070312, -0.07715606689453125, -0.06679916381835938, -0.0564422607421875, -0.046085357666015625, -0.03572845458984375, -0.025371551513671875, -0.0150146484375, -0.004657745361328125, 0.00569915771484375, 0.016056060791015625, 0.0264129638671875, 0.036769866943359375, 0.04712677001953125, 0.057483673095703125, 0.067840576171875, 0.07819747924804688, 0.08855438232421875, 0.09891128540039062, 0.1092681884765625, 0.11962509155273438, 0.12998199462890625, 0.14033889770507812, 0.15069580078125, 0.16105270385742188, 0.17140960693359375, 0.18176651000976562, 0.1921234130859375, 0.20248031616210938, 0.21283721923828125, 0.22319412231445312, 0.233551025390625, 0.24390792846679688, 0.25426483154296875, 0.2646217346191406, 0.2749786376953125, 0.2853355407714844, 0.29569244384765625, 0.3060493469238281, 0.31640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 13.0, 11.0, 15.0, 21.0, 23.0, 20.0, 25.0, 28.0, 46.0, 47.0, 69.0, 61.0, 94.0, 80.0, 66.0, 49.0, 56.0, 42.0, 34.0, 26.0, 30.0, 19.0, 17.0, 13.0, 10.0, 10.0, 10.0, 7.0, 6.0, 6.0, 1.0, 3.0, 4.0, 4.0, 0.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125999450683594e-05, -4.9598515033721924e-05, -4.793703556060791e-05, -4.6275556087493896e-05, -4.461407661437988e-05, -4.295259714126587e-05, -4.1291117668151855e-05, -3.962963819503784e-05, -3.796815872192383e-05, -3.6306679248809814e-05, -3.46451997756958e-05, -3.298372030258179e-05, -3.1322240829467773e-05, -2.966076135635376e-05, -2.7999281883239746e-05, -2.6337802410125732e-05, -2.467632293701172e-05, -2.3014843463897705e-05, -2.135336399078369e-05, -1.9691884517669678e-05, -1.8030405044555664e-05, -1.636892557144165e-05, -1.4707446098327637e-05, -1.3045966625213623e-05, -1.138448715209961e-05, -9.723007678985596e-06, -8.061528205871582e-06, -6.400048732757568e-06, -4.738569259643555e-06, -3.077089786529541e-06, -1.4156103134155273e-06, 2.4586915969848633e-07, 1.9073486328125e-06, 3.5688281059265137e-06, 5.230307579040527e-06, 6.891787052154541e-06, 8.553266525268555e-06, 1.0214745998382568e-05, 1.1876225471496582e-05, 1.3537704944610596e-05, 1.519918441772461e-05, 1.6860663890838623e-05, 1.8522143363952637e-05, 2.018362283706665e-05, 2.1845102310180664e-05, 2.3506581783294678e-05, 2.516806125640869e-05, 2.6829540729522705e-05, 2.849102020263672e-05, 3.0152499675750732e-05, 3.1813979148864746e-05, 3.347545862197876e-05, 3.5136938095092773e-05, 3.679841756820679e-05, 3.84598970413208e-05, 4.0121376514434814e-05, 4.178285598754883e-05, 4.344433546066284e-05, 4.5105814933776855e-05, 4.676729440689087e-05, 4.842877388000488e-05, 5.0090253353118896e-05, 5.175173282623291e-05, 5.3413212299346924e-05, 5.507469177246094e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 9.0, 25.0, 32.0, 63.0, 93.0, 213.0, 483.0, 1031.0, 2874.0, 12381.0, 114285.0, 833485.0, 70880.0, 8844.0, 2262.0, 779.0, 376.0, 203.0, 83.0, 55.0, 38.0, 23.0, 12.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376220703125, -0.3658866882324219, -0.35555267333984375, -0.3452186584472656, -0.3348846435546875, -0.3245506286621094, -0.31421661376953125, -0.3038825988769531, -0.293548583984375, -0.2832145690917969, -0.27288055419921875, -0.2625465393066406, -0.2522125244140625, -0.24187850952148438, -0.23154449462890625, -0.22121047973632812, -0.21087646484375, -0.20054244995117188, -0.19020843505859375, -0.17987442016601562, -0.1695404052734375, -0.15920639038085938, -0.14887237548828125, -0.13853836059570312, -0.128204345703125, -0.11787033081054688, -0.10753631591796875, -0.09720230102539062, -0.0868682861328125, -0.07653427124023438, -0.06620025634765625, -0.055866241455078125, -0.0455322265625, -0.035198211669921875, -0.02486419677734375, -0.014530181884765625, -0.0041961669921875, 0.006137847900390625, 0.01647186279296875, 0.026805877685546875, 0.037139892578125, 0.047473907470703125, 0.05780792236328125, 0.06814193725585938, 0.0784759521484375, 0.08880996704101562, 0.09914398193359375, 0.10947799682617188, 0.11981201171875, 0.13014602661132812, 0.14048004150390625, 0.15081405639648438, 0.1611480712890625, 0.17148208618164062, 0.18181610107421875, 0.19215011596679688, 0.202484130859375, 0.21281814575195312, 0.22315216064453125, 0.23348617553710938, 0.2438201904296875, 0.2541542053222656, 0.26448822021484375, 0.2748222351074219, 0.28515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 8.0, 15.0, 21.0, 20.0, 28.0, 44.0, 38.0, 58.0, 82.0, 90.0, 98.0, 88.0, 86.0, 70.0, 63.0, 56.0, 39.0, 23.0, 23.0, 10.0, 12.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146240234375, -0.13813400268554688, -0.13002777099609375, -0.12192153930664062, -0.1138153076171875, -0.10570907592773438, -0.09760284423828125, -0.08949661254882812, -0.081390380859375, -0.07328414916992188, -0.06517791748046875, -0.057071685791015625, -0.0489654541015625, -0.040859222412109375, -0.03275299072265625, -0.024646759033203125, -0.01654052734375, -0.008434295654296875, -0.00032806396484375, 0.007778167724609375, 0.0158843994140625, 0.023990631103515625, 0.03209686279296875, 0.040203094482421875, 0.048309326171875, 0.056415557861328125, 0.06452178955078125, 0.07262802124023438, 0.0807342529296875, 0.08884048461914062, 0.09694671630859375, 0.10505294799804688, 0.1131591796875, 0.12126541137695312, 0.12937164306640625, 0.13747787475585938, 0.1455841064453125, 0.15369033813476562, 0.16179656982421875, 0.16990280151367188, 0.178009033203125, 0.18611526489257812, 0.19422149658203125, 0.20232772827148438, 0.2104339599609375, 0.21854019165039062, 0.22664642333984375, 0.23475265502929688, 0.24285888671875, 0.2509651184082031, 0.25907135009765625, 0.2671775817871094, 0.2752838134765625, 0.2833900451660156, 0.29149627685546875, 0.2996025085449219, 0.307708740234375, 0.3158149719238281, 0.32392120361328125, 0.3320274353027344, 0.3401336669921875, 0.3482398986816406, 0.35634613037109375, 0.3644523620605469, 0.37255859375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 5.0, 10.0, 20.0, 49.0, 116.0, 336.0, 269.0, 91.0, 50.0, 24.0, 16.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.845046997070312, -8.539398193359375, -8.233749389648438, -7.928099632263184, -7.622450828552246, -7.316802024841309, -7.011152744293213, -6.705503463745117, -6.39985466003418, -6.094205856323242, -5.7885565757751465, -5.482907295227051, -5.177258491516113, -4.871609687805176, -4.56596040725708, -4.260311126708984, -3.954662322998047, -3.6490132808685303, -3.3433642387390137, -3.037715196609497, -2.7320661544799805, -2.426417112350464, -2.1207680702209473, -1.8151190280914307, -1.509469985961914, -1.2038209438323975, -0.8981719017028809, -0.5925228595733643, -0.28687381744384766, 0.018775224685668945, 0.32442426681518555, 0.6300733089447021, 0.9357233047485352, 1.2413723468780518, 1.5470213890075684, 1.852670431137085, 2.1583194732666016, 2.463968515396118, 2.7696175575256348, 3.0752665996551514, 3.380915641784668, 3.6865646839141846, 3.992213726043701, 4.297863006591797, 4.603511810302734, 4.909160614013672, 5.214809894561768, 5.520459175109863, 5.826107978820801, 6.131756782531738, 6.437406063079834, 6.74305534362793, 7.048704147338867, 7.354352951049805, 7.6600022315979, 7.965651512145996, 8.271300315856934, 8.576949119567871, 8.882598876953125, 9.188247680664062, 9.493896484375, 9.799545288085938, 10.105194091796875, 10.410843849182129, 10.716492652893066]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 6.0, 4.0, 2.0, 5.0, 8.0, 5.0, 11.0, 13.0, 18.0, 12.0, 12.0, 23.0, 19.0, 22.0, 31.0, 26.0, 37.0, 25.0, 50.0, 99.0, 166.0, 89.0, 47.0, 39.0, 26.0, 22.0, 21.0, 22.0, 18.0, 19.0, 21.0, 14.0, 7.0, 6.0, 8.0, 8.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0, 9.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.150975227355957, -4.969811916351318, -4.788649082183838, -4.607485771179199, -4.426322937011719, -4.24515962600708, -4.063996315002441, -3.882833480834961, -3.7016704082489014, -3.520507335662842, -3.3393442630767822, -3.1581811904907227, -2.977017879486084, -2.7958550453186035, -2.614691734313965, -2.4335286617279053, -2.2523655891418457, -2.071202516555786, -1.8900394439697266, -1.7088762521743774, -1.5277131795883179, -1.3465501070022583, -1.1653869152069092, -0.9842238426208496, -0.80306077003479, -0.6218976974487305, -0.4407345652580261, -0.2595714330673218, -0.07840836048126221, 0.10275471210479736, 0.2839179039001465, 0.46508097648620605, 0.6462440490722656, 0.8274071216583252, 1.0085701942443848, 1.1897333860397339, 1.3708964586257935, 1.552059531211853, 1.7332227230072021, 1.9143857955932617, 2.0955488681793213, 2.276711940765381, 2.4578750133514404, 2.6390380859375, 2.8202013969421387, 3.001364231109619, 3.182527542114258, 3.3636906147003174, 3.544853687286377, 3.7260167598724365, 3.907179832458496, 4.088343143463135, 4.269505977630615, 4.450669288635254, 4.631832122802734, 4.812995433807373, 4.994158744812012, 5.17532205581665, 5.356484889984131, 5.5376482009887695, 5.71881103515625, 5.899974346160889, 6.081137657165527, 6.262300491333008, 6.443463325500488]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 12.0, 10.0, 12.0, 26.0, 47.0, 71.0, 145.0, 244.0, 512.0, 943.0, 2315.0, 6326.0, 26968.0, 222531.0, 1947236.0, 1757586.0, 193331.0, 25206.0, 6272.0, 2332.0, 1036.0, 520.0, 257.0, 129.0, 80.0, 47.0, 26.0, 13.0, 10.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.85986328125, -0.8352737426757812, -0.8106842041015625, -0.7860946655273438, -0.761505126953125, -0.7369155883789062, -0.7123260498046875, -0.6877365112304688, -0.66314697265625, -0.6385574340820312, -0.6139678955078125, -0.5893783569335938, -0.564788818359375, -0.5401992797851562, -0.5156097412109375, -0.49102020263671875, -0.4664306640625, -0.44184112548828125, -0.4172515869140625, -0.39266204833984375, -0.368072509765625, -0.34348297119140625, -0.3188934326171875, -0.29430389404296875, -0.26971435546875, -0.24512481689453125, -0.2205352783203125, -0.19594573974609375, -0.171356201171875, -0.14676666259765625, -0.1221771240234375, -0.09758758544921875, -0.072998046875, -0.04840850830078125, -0.0238189697265625, 0.00077056884765625, 0.025360107421875, 0.04994964599609375, 0.0745391845703125, 0.09912872314453125, 0.12371826171875, 0.14830780029296875, 0.1728973388671875, 0.19748687744140625, 0.222076416015625, 0.24666595458984375, 0.2712554931640625, 0.29584503173828125, 0.3204345703125, 0.34502410888671875, 0.3696136474609375, 0.39420318603515625, 0.418792724609375, 0.44338226318359375, 0.4679718017578125, 0.49256134033203125, 0.51715087890625, 0.5417404174804688, 0.5663299560546875, 0.5909194946289062, 0.615509033203125, 0.6400985717773438, 0.6646881103515625, 0.6892776489257812, 0.7138671875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 7.0, 9.0, 11.0, 18.0, 19.0, 20.0, 23.0, 31.0, 42.0, 37.0, 42.0, 71.0, 64.0, 60.0, 58.0, 66.0, 60.0, 49.0, 45.0, 35.0, 34.0, 24.0, 36.0, 24.0, 26.0, 19.0, 15.0, 12.0, 6.0, 3.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361572265625, -0.3504638671875, -0.33935546875, -0.3282470703125, -0.317138671875, -0.3060302734375, -0.294921875, -0.2838134765625, -0.272705078125, -0.2615966796875, -0.25048828125, -0.2393798828125, -0.228271484375, -0.2171630859375, -0.2060546875, -0.1949462890625, -0.183837890625, -0.1727294921875, -0.16162109375, -0.1505126953125, -0.139404296875, -0.1282958984375, -0.1171875, -0.1060791015625, -0.094970703125, -0.0838623046875, -0.07275390625, -0.0616455078125, -0.050537109375, -0.0394287109375, -0.0283203125, -0.0172119140625, -0.006103515625, 0.0050048828125, 0.01611328125, 0.0272216796875, 0.038330078125, 0.0494384765625, 0.060546875, 0.0716552734375, 0.082763671875, 0.0938720703125, 0.10498046875, 0.1160888671875, 0.127197265625, 0.1383056640625, 0.1494140625, 0.1605224609375, 0.171630859375, 0.1827392578125, 0.19384765625, 0.2049560546875, 0.216064453125, 0.2271728515625, 0.23828125, 0.2493896484375, 0.260498046875, 0.2716064453125, 0.28271484375, 0.2938232421875, 0.304931640625, 0.3160400390625, 0.3271484375, 0.3382568359375, 0.349365234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 10.0, 8.0, 22.0, 20.0, 40.0, 47.0, 66.0, 83.0, 131.0, 211.0, 350.0, 604.0, 1140.0, 2553.0, 7780.0, 47250.0, 2319179.0, 1760310.0, 42195.0, 7201.0, 2410.0, 1094.0, 580.0, 318.0, 229.0, 150.0, 93.0, 51.0, 36.0, 30.0, 19.0, 17.0, 10.0, 8.0, 8.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6005859375, -1.5534820556640625, -1.506378173828125, -1.4592742919921875, -1.41217041015625, -1.3650665283203125, -1.317962646484375, -1.2708587646484375, -1.2237548828125, -1.1766510009765625, -1.129547119140625, -1.0824432373046875, -1.03533935546875, -0.9882354736328125, -0.941131591796875, -0.8940277099609375, -0.846923828125, -0.7998199462890625, -0.752716064453125, -0.7056121826171875, -0.65850830078125, -0.6114044189453125, -0.564300537109375, -0.5171966552734375, -0.4700927734375, -0.4229888916015625, -0.375885009765625, -0.3287811279296875, -0.28167724609375, -0.2345733642578125, -0.187469482421875, -0.1403656005859375, -0.09326171875, -0.0461578369140625, 0.000946044921875, 0.0480499267578125, 0.09515380859375, 0.1422576904296875, 0.189361572265625, 0.2364654541015625, 0.2835693359375, 0.3306732177734375, 0.377777099609375, 0.4248809814453125, 0.47198486328125, 0.5190887451171875, 0.566192626953125, 0.6132965087890625, 0.660400390625, 0.7075042724609375, 0.754608154296875, 0.8017120361328125, 0.84881591796875, 0.8959197998046875, 0.943023681640625, 0.9901275634765625, 1.0372314453125, 1.0843353271484375, 1.131439208984375, 1.1785430908203125, 1.22564697265625, 1.2727508544921875, 1.319854736328125, 1.3669586181640625, 1.4140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 5.0, 9.0, 12.0, 15.0, 13.0, 33.0, 48.0, 61.0, 80.0, 120.0, 179.0, 229.0, 337.0, 468.0, 558.0, 558.0, 407.0, 276.0, 209.0, 149.0, 92.0, 67.0, 44.0, 34.0, 21.0, 16.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3709259033203125, -1.334625244140625, -1.2983245849609375, -1.26202392578125, -1.2257232666015625, -1.189422607421875, -1.1531219482421875, -1.1168212890625, -1.0805206298828125, -1.044219970703125, -1.0079193115234375, -0.97161865234375, -0.9353179931640625, -0.899017333984375, -0.8627166748046875, -0.826416015625, -0.7901153564453125, -0.753814697265625, -0.7175140380859375, -0.68121337890625, -0.6449127197265625, -0.608612060546875, -0.5723114013671875, -0.5360107421875, -0.4997100830078125, -0.463409423828125, -0.4271087646484375, -0.39080810546875, -0.3545074462890625, -0.318206787109375, -0.2819061279296875, -0.24560546875, -0.2093048095703125, -0.173004150390625, -0.1367034912109375, -0.10040283203125, -0.0641021728515625, -0.027801513671875, 0.0084991455078125, 0.0447998046875, 0.0811004638671875, 0.117401123046875, 0.1537017822265625, 0.19000244140625, 0.2263031005859375, 0.262603759765625, 0.2989044189453125, 0.335205078125, 0.3715057373046875, 0.407806396484375, 0.4441070556640625, 0.48040771484375, 0.5167083740234375, 0.553009033203125, 0.5893096923828125, 0.6256103515625, 0.6619110107421875, 0.698211669921875, 0.7345123291015625, 0.77081298828125, 0.8071136474609375, 0.843414306640625, 0.8797149658203125, 0.916015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 14.0, 30.0, 56.0, 112.0, 232.0, 262.0, 143.0, 76.0, 26.0, 15.0, 7.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.248767852783203, -19.638607025146484, -19.028446197509766, -18.418283462524414, -17.808122634887695, -17.197961807250977, -16.587799072265625, -15.977638244628906, -15.367477416992188, -14.757316589355469, -14.147154808044434, -13.536993026733398, -12.92683219909668, -12.316671371459961, -11.706509590148926, -11.09634780883789, -10.486186981201172, -9.876026153564453, -9.265864372253418, -8.655702590942383, -8.045541763305664, -7.435380458831787, -6.82521915435791, -6.215057849884033, -5.604896545410156, -4.994735240936279, -4.384573936462402, -3.7744126319885254, -3.1642513275146484, -2.5540900230407715, -1.9439287185668945, -1.3337674140930176, -0.7236080169677734, -0.11344671249389648, 0.49671459197998047, 1.1068758964538574, 1.7170372009277344, 2.3271985054016113, 2.9373598098754883, 3.5475211143493652, 4.157682418823242, 4.767843723297119, 5.378005027770996, 5.988166332244873, 6.59832763671875, 7.208488941192627, 7.818650245666504, 8.428812026977539, 9.038972854614258, 9.649133682250977, 10.259295463562012, 10.869457244873047, 11.479618072509766, 12.089778900146484, 12.69994068145752, 13.310102462768555, 13.920263290405273, 14.530424118041992, 15.140585899353027, 15.750747680664062, 16.36090850830078, 16.9710693359375, 17.58123016357422, 18.19139289855957, 18.80155372619629]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 5.0, 5.0, 13.0, 11.0, 14.0, 14.0, 20.0, 27.0, 20.0, 22.0, 26.0, 28.0, 31.0, 26.0, 32.0, 32.0, 34.0, 57.0, 64.0, 70.0, 43.0, 42.0, 50.0, 32.0, 32.0, 30.0, 34.0, 25.0, 34.0, 25.0, 14.0, 15.0, 19.0, 8.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.119375228881836, -5.936121940612793, -5.752869129180908, -5.569616317749023, -5.3863630294799805, -5.2031097412109375, -5.019856929779053, -4.836604118347168, -4.653350830078125, -4.470097541809082, -4.286844730377197, -4.1035919189453125, -3.9203386306762695, -3.7370855808258057, -3.553832530975342, -3.370579481124878, -3.187326431274414, -3.00407338142395, -2.8208203315734863, -2.6375672817230225, -2.4543142318725586, -2.2710611820220947, -2.087808132171631, -1.904555082321167, -1.7213020324707031, -1.5380489826202393, -1.3547959327697754, -1.1715428829193115, -0.9882898330688477, -0.8050367832183838, -0.6217837333679199, -0.43853068351745605, -0.2552781105041504, -0.07202506065368652, 0.11122798919677734, 0.2944810390472412, 0.4777340888977051, 0.660987138748169, 0.8442401885986328, 1.0274932384490967, 1.2107462882995605, 1.3939993381500244, 1.5772523880004883, 1.7605054378509521, 1.943758487701416, 2.12701153755188, 2.3102645874023438, 2.4935176372528076, 2.6767706871032715, 2.8600237369537354, 3.043276786804199, 3.226529836654663, 3.409782886505127, 3.593035936355591, 3.7762889862060547, 3.9595420360565186, 4.142795085906982, 4.326047897338867, 4.50930118560791, 4.692554473876953, 4.875807285308838, 5.059060096740723, 5.242313385009766, 5.425566673278809, 5.608819484710693]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 8.0, 10.0, 14.0, 13.0, 9.0, 20.0, 35.0, 52.0, 86.0, 142.0, 243.0, 395.0, 704.0, 1478.0, 3029.0, 7000.0, 18730.0, 63785.0, 359880.0, 481678.0, 75037.0, 21450.0, 7862.0, 3395.0, 1578.0, 795.0, 425.0, 254.0, 145.0, 99.0, 53.0, 26.0, 27.0, 21.0, 19.0, 6.0, 9.0, 15.0, 3.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.72216796875, -0.7009658813476562, -0.6797637939453125, -0.6585617065429688, -0.637359619140625, -0.6161575317382812, -0.5949554443359375, -0.5737533569335938, -0.55255126953125, -0.5313491821289062, -0.5101470947265625, -0.48894500732421875, -0.467742919921875, -0.44654083251953125, -0.4253387451171875, -0.40413665771484375, -0.3829345703125, -0.36173248291015625, -0.3405303955078125, -0.31932830810546875, -0.298126220703125, -0.27692413330078125, -0.2557220458984375, -0.23451995849609375, -0.21331787109375, -0.19211578369140625, -0.1709136962890625, -0.14971160888671875, -0.128509521484375, -0.10730743408203125, -0.0861053466796875, -0.06490325927734375, -0.043701171875, -0.02249908447265625, -0.0012969970703125, 0.01990509033203125, 0.041107177734375, 0.06230926513671875, 0.0835113525390625, 0.10471343994140625, 0.12591552734375, 0.14711761474609375, 0.1683197021484375, 0.18952178955078125, 0.210723876953125, 0.23192596435546875, 0.2531280517578125, 0.27433013916015625, 0.2955322265625, 0.31673431396484375, 0.3379364013671875, 0.35913848876953125, 0.380340576171875, 0.40154266357421875, 0.4227447509765625, 0.44394683837890625, 0.46514892578125, 0.48635101318359375, 0.5075531005859375, 0.5287551879882812, 0.549957275390625, 0.5711593627929688, 0.5923614501953125, 0.6135635375976562, 0.634765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 13.0, 9.0, 13.0, 19.0, 18.0, 21.0, 28.0, 33.0, 41.0, 45.0, 57.0, 56.0, 64.0, 55.0, 65.0, 71.0, 54.0, 42.0, 49.0, 38.0, 37.0, 30.0, 35.0, 18.0, 13.0, 13.0, 12.0, 8.0, 9.0, 5.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.462158203125, -0.4486351013183594, -0.43511199951171875, -0.4215888977050781, -0.4080657958984375, -0.3945426940917969, -0.38101959228515625, -0.3674964904785156, -0.353973388671875, -0.3404502868652344, -0.32692718505859375, -0.3134040832519531, -0.2998809814453125, -0.2863578796386719, -0.27283477783203125, -0.2593116760253906, -0.24578857421875, -0.23226547241210938, -0.21874237060546875, -0.20521926879882812, -0.1916961669921875, -0.17817306518554688, -0.16464996337890625, -0.15112686157226562, -0.137603759765625, -0.12408065795898438, -0.11055755615234375, -0.09703445434570312, -0.0835113525390625, -0.06998825073242188, -0.05646514892578125, -0.042942047119140625, -0.0294189453125, -0.015895843505859375, -0.00237274169921875, 0.011150360107421875, 0.0246734619140625, 0.038196563720703125, 0.05171966552734375, 0.06524276733398438, 0.078765869140625, 0.09228897094726562, 0.10581207275390625, 0.11933517456054688, 0.1328582763671875, 0.14638137817382812, 0.15990447998046875, 0.17342758178710938, 0.18695068359375, 0.20047378540039062, 0.21399688720703125, 0.22751998901367188, 0.2410430908203125, 0.2545661926269531, 0.26808929443359375, 0.2816123962402344, 0.295135498046875, 0.3086585998535156, 0.32218170166015625, 0.3357048034667969, 0.3492279052734375, 0.3627510070800781, 0.37627410888671875, 0.3897972106933594, 0.4033203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 8.0, 5.0, 3.0, 8.0, 14.0, 19.0, 21.0, 29.0, 54.0, 81.0, 134.0, 192.0, 310.0, 609.0, 1378.0, 4693.0, 31372.0, 882322.0, 112405.0, 10606.0, 2242.0, 838.0, 444.0, 253.0, 162.0, 110.0, 85.0, 46.0, 29.0, 33.0, 21.0, 10.0, 5.0, 6.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0], "bins": [-1.2197265625, -1.187408447265625, -1.15509033203125, -1.122772216796875, -1.0904541015625, -1.058135986328125, -1.02581787109375, -0.993499755859375, -0.961181640625, -0.928863525390625, -0.89654541015625, -0.864227294921875, -0.8319091796875, -0.799591064453125, -0.76727294921875, -0.734954833984375, -0.70263671875, -0.670318603515625, -0.63800048828125, -0.605682373046875, -0.5733642578125, -0.541046142578125, -0.50872802734375, -0.476409912109375, -0.444091796875, -0.411773681640625, -0.37945556640625, -0.347137451171875, -0.3148193359375, -0.282501220703125, -0.25018310546875, -0.217864990234375, -0.185546875, -0.153228759765625, -0.12091064453125, -0.088592529296875, -0.0562744140625, -0.023956298828125, 0.00836181640625, 0.040679931640625, 0.072998046875, 0.105316162109375, 0.13763427734375, 0.169952392578125, 0.2022705078125, 0.234588623046875, 0.26690673828125, 0.299224853515625, 0.33154296875, 0.363861083984375, 0.39617919921875, 0.428497314453125, 0.4608154296875, 0.493133544921875, 0.52545166015625, 0.557769775390625, 0.590087890625, 0.622406005859375, 0.65472412109375, 0.687042236328125, 0.7193603515625, 0.751678466796875, 0.78399658203125, 0.816314697265625, 0.8486328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 7.0, 11.0, 7.0, 13.0, 14.0, 17.0, 20.0, 36.0, 29.0, 44.0, 42.0, 53.0, 84.0, 82.0, 98.0, 83.0, 68.0, 42.0, 38.0, 28.0, 26.0, 24.0, 19.0, 18.0, 14.0, 12.0, 10.0, 12.0, 5.0, 10.0, 7.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.7966461181640625, -1.742706298828125, -1.6887664794921875, -1.63482666015625, -1.5808868408203125, -1.526947021484375, -1.4730072021484375, -1.4190673828125, -1.3651275634765625, -1.311187744140625, -1.2572479248046875, -1.20330810546875, -1.1493682861328125, -1.095428466796875, -1.0414886474609375, -0.987548828125, -0.9336090087890625, -0.879669189453125, -0.8257293701171875, -0.77178955078125, -0.7178497314453125, -0.663909912109375, -0.6099700927734375, -0.5560302734375, -0.5020904541015625, -0.448150634765625, -0.3942108154296875, -0.34027099609375, -0.2863311767578125, -0.232391357421875, -0.1784515380859375, -0.12451171875, -0.0705718994140625, -0.016632080078125, 0.0373077392578125, 0.09124755859375, 0.1451873779296875, 0.199127197265625, 0.2530670166015625, 0.3070068359375, 0.3609466552734375, 0.414886474609375, 0.4688262939453125, 0.52276611328125, 0.5767059326171875, 0.630645751953125, 0.6845855712890625, 0.738525390625, 0.7924652099609375, 0.846405029296875, 0.9003448486328125, 0.95428466796875, 1.0082244873046875, 1.062164306640625, 1.1161041259765625, 1.1700439453125, 1.2239837646484375, 1.277923583984375, 1.3318634033203125, 1.38580322265625, 1.4397430419921875, 1.493682861328125, 1.5476226806640625, 1.6015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 20.0, 18.0, 30.0, 40.0, 78.0, 142.0, 287.0, 682.0, 1837.0, 6790.0, 41730.0, 905192.0, 77254.0, 10406.0, 2546.0, 788.0, 299.0, 154.0, 86.0, 54.0, 26.0, 17.0, 17.0, 10.0, 11.0, 9.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.187744140625, -0.1821613311767578, -0.17657852172851562, -0.17099571228027344, -0.16541290283203125, -0.15983009338378906, -0.15424728393554688, -0.1486644744873047, -0.1430816650390625, -0.1374988555908203, -0.13191604614257812, -0.12633323669433594, -0.12075042724609375, -0.11516761779785156, -0.10958480834960938, -0.10400199890136719, -0.098419189453125, -0.09283638000488281, -0.08725357055664062, -0.08167076110839844, -0.07608795166015625, -0.07050514221191406, -0.06492233276367188, -0.05933952331542969, -0.0537567138671875, -0.04817390441894531, -0.042591094970703125, -0.03700828552246094, -0.03142547607421875, -0.025842666625976562, -0.020259857177734375, -0.014677047729492188, -0.00909423828125, -0.0035114288330078125, 0.002071380615234375, 0.0076541900634765625, 0.01323699951171875, 0.018819808959960938, 0.024402618408203125, 0.029985427856445312, 0.0355682373046875, 0.04115104675292969, 0.046733856201171875, 0.05231666564941406, 0.05789947509765625, 0.06348228454589844, 0.06906509399414062, 0.07464790344238281, 0.080230712890625, 0.08581352233886719, 0.09139633178710938, 0.09697914123535156, 0.10256195068359375, 0.10814476013183594, 0.11372756958007812, 0.11931037902832031, 0.1248931884765625, 0.1304759979248047, 0.13605880737304688, 0.14164161682128906, 0.14722442626953125, 0.15280723571777344, 0.15839004516601562, 0.1639728546142578, 0.1695556640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 3.0, 8.0, 11.0, 10.0, 10.0, 15.0, 18.0, 28.0, 26.0, 29.0, 49.0, 72.0, 88.0, 120.0, 109.0, 99.0, 71.0, 57.0, 43.0, 32.0, 27.0, 15.0, 16.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93986701965332e-05, -3.812834620475769e-05, -3.685802221298218e-05, -3.5587698221206665e-05, -3.431737422943115e-05, -3.304705023765564e-05, -3.177672624588013e-05, -3.0506402254104614e-05, -2.92360782623291e-05, -2.796575427055359e-05, -2.6695430278778076e-05, -2.5425106287002563e-05, -2.415478229522705e-05, -2.2884458303451538e-05, -2.1614134311676025e-05, -2.0343810319900513e-05, -1.9073486328125e-05, -1.7803162336349487e-05, -1.6532838344573975e-05, -1.5262514352798462e-05, -1.399219036102295e-05, -1.2721866369247437e-05, -1.1451542377471924e-05, -1.0181218385696411e-05, -8.910894393920898e-06, -7.640570402145386e-06, -6.370246410369873e-06, -5.09992241859436e-06, -3.829598426818848e-06, -2.559274435043335e-06, -1.2889504432678223e-06, -1.862645149230957e-08, 1.2516975402832031e-06, 2.522021532058716e-06, 3.7923455238342285e-06, 5.062669515609741e-06, 6.332993507385254e-06, 7.603317499160767e-06, 8.87364149093628e-06, 1.0143965482711792e-05, 1.1414289474487305e-05, 1.2684613466262817e-05, 1.395493745803833e-05, 1.5225261449813843e-05, 1.6495585441589355e-05, 1.7765909433364868e-05, 1.903623342514038e-05, 2.0306557416915894e-05, 2.1576881408691406e-05, 2.284720540046692e-05, 2.411752939224243e-05, 2.5387853384017944e-05, 2.6658177375793457e-05, 2.792850136756897e-05, 2.9198825359344482e-05, 3.0469149351119995e-05, 3.173947334289551e-05, 3.300979733467102e-05, 3.428012132644653e-05, 3.5550445318222046e-05, 3.682076930999756e-05, 3.809109330177307e-05, 3.9361417293548584e-05, 4.06317412853241e-05, 4.190206527709961e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 6.0, 9.0, 9.0, 16.0, 11.0, 24.0, 28.0, 48.0, 46.0, 78.0, 129.0, 195.0, 307.0, 474.0, 739.0, 1350.0, 2488.0, 5260.0, 12045.0, 35909.0, 198063.0, 717550.0, 46552.0, 14540.0, 5928.0, 2897.0, 1513.0, 874.0, 502.0, 303.0, 211.0, 143.0, 104.0, 56.0, 37.0, 21.0, 28.0, 21.0, 15.0, 7.0, 9.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0936279296875, -0.09051704406738281, -0.08740615844726562, -0.08429527282714844, -0.08118438720703125, -0.07807350158691406, -0.07496261596679688, -0.07185173034667969, -0.0687408447265625, -0.06562995910644531, -0.06251907348632812, -0.05940818786621094, -0.05629730224609375, -0.05318641662597656, -0.050075531005859375, -0.04696464538574219, -0.043853759765625, -0.04074287414550781, -0.037631988525390625, -0.03452110290527344, -0.03141021728515625, -0.028299331665039062, -0.025188446044921875, -0.022077560424804688, -0.0189666748046875, -0.015855789184570312, -0.012744903564453125, -0.009634017944335938, -0.00652313232421875, -0.0034122467041015625, -0.000301361083984375, 0.0028095245361328125, 0.00592041015625, 0.009031295776367188, 0.012142181396484375, 0.015253067016601562, 0.01836395263671875, 0.021474838256835938, 0.024585723876953125, 0.027696609497070312, 0.0308074951171875, 0.03391838073730469, 0.037029266357421875, 0.04014015197753906, 0.04325103759765625, 0.04636192321777344, 0.049472808837890625, 0.05258369445800781, 0.055694580078125, 0.05880546569824219, 0.061916351318359375, 0.06502723693847656, 0.06813812255859375, 0.07124900817871094, 0.07435989379882812, 0.07747077941894531, 0.0805816650390625, 0.08369255065917969, 0.08680343627929688, 0.08991432189941406, 0.09302520751953125, 0.09613609313964844, 0.09924697875976562, 0.10235786437988281, 0.10546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 2.0, 8.0, 5.0, 13.0, 18.0, 14.0, 21.0, 40.0, 34.0, 63.0, 69.0, 81.0, 101.0, 91.0, 77.0, 72.0, 55.0, 40.0, 34.0, 26.0, 29.0, 21.0, 12.0, 9.0, 13.0, 9.0, 5.0, 4.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1219482421875, -0.11815738677978516, -0.11436653137207031, -0.11057567596435547, -0.10678482055664062, -0.10299396514892578, -0.09920310974121094, -0.0954122543334961, -0.09162139892578125, -0.0878305435180664, -0.08403968811035156, -0.08024883270263672, -0.07645797729492188, -0.07266712188720703, -0.06887626647949219, -0.06508541107177734, -0.0612945556640625, -0.057503700256347656, -0.05371284484863281, -0.04992198944091797, -0.046131134033203125, -0.04234027862548828, -0.03854942321777344, -0.034758567810058594, -0.03096771240234375, -0.027176856994628906, -0.023386001586914062, -0.01959514617919922, -0.015804290771484375, -0.012013435363769531, -0.008222579956054688, -0.004431724548339844, -0.000640869140625, 0.0031499862670898438, 0.0069408416748046875, 0.010731697082519531, 0.014522552490234375, 0.01831340789794922, 0.022104263305664062, 0.025895118713378906, 0.02968597412109375, 0.033476829528808594, 0.03726768493652344, 0.04105854034423828, 0.044849395751953125, 0.04864025115966797, 0.05243110656738281, 0.056221961975097656, 0.0600128173828125, 0.06380367279052734, 0.06759452819824219, 0.07138538360595703, 0.07517623901367188, 0.07896709442138672, 0.08275794982910156, 0.0865488052368164, 0.09033966064453125, 0.0941305160522461, 0.09792137145996094, 0.10171222686767578, 0.10550308227539062, 0.10929393768310547, 0.11308479309082031, 0.11687564849853516, 0.12066650390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 11.0, 13.0, 22.0, 39.0, 53.0, 88.0, 519.0, 100.0, 67.0, 27.0, 17.0, 21.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364222526550293, -5.18243932723999, -5.0006561279296875, -4.818872451782227, -4.637089252471924, -4.455306053161621, -4.27352237701416, -4.091739177703857, -3.9099559783935547, -3.728172779083252, -3.54638934135437, -3.3646059036254883, -3.1828227043151855, -3.001039505004883, -2.819256067276001, -2.637472629547119, -2.4556894302368164, -2.2739062309265137, -2.092122793197632, -1.9103394746780396, -1.7285561561584473, -1.546772837638855, -1.3649895191192627, -1.1832062005996704, -1.0014228820800781, -0.8196395635604858, -0.6378562450408936, -0.45607292652130127, -0.274289608001709, -0.0925062894821167, 0.08927702903747559, 0.27106034755706787, 0.45284414291381836, 0.6346274614334106, 0.8164107799530029, 0.9981940984725952, 1.1799774169921875, 1.3617607355117798, 1.543544054031372, 1.7253273725509644, 1.9071106910705566, 2.0888938903808594, 2.270677328109741, 2.452460765838623, 2.634243965148926, 2.8160271644592285, 2.9978106021881104, 3.179594039916992, 3.361377239227295, 3.5431604385375977, 3.7249438762664795, 3.9067273139953613, 4.088510513305664, 4.270293712615967, 4.4520769119262695, 4.6338605880737305, 4.815643787384033, 4.997426986694336, 5.179210662841797, 5.3609938621521, 5.542777061462402, 5.724560260772705, 5.906343460083008, 6.088127136230469, 6.2699103355407715]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 6.0, 6.0, 4.0, 7.0, 8.0, 4.0, 8.0, 12.0, 19.0, 18.0, 21.0, 23.0, 26.0, 27.0, 25.0, 38.0, 180.0, 260.0, 83.0, 32.0, 25.0, 14.0, 15.0, 15.0, 12.0, 9.0, 10.0, 19.0, 8.0, 8.0, 10.0, 8.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.015302658081055, -3.894341230392456, -3.7733800411224365, -3.652418613433838, -3.5314571857452393, -3.4104957580566406, -3.289534568786621, -3.1685731410980225, -3.047611713409424, -2.926650285720825, -2.8056890964508057, -2.684727668762207, -2.5637662410736084, -2.4428048133850098, -2.3218436241149902, -2.2008821964263916, -2.079921007156372, -1.958959698677063, -1.8379982709884644, -1.7170369625091553, -1.5960755348205566, -1.4751142263412476, -1.3541529178619385, -1.2331914901733398, -1.1122301816940308, -0.9912688136100769, -0.870307445526123, -0.749346137046814, -0.6283847689628601, -0.5074234008789062, -0.38646209239959717, -0.2655007243156433, -0.14453959465026855, -0.02357824146747589, 0.09738311171531677, 0.21834444999694824, 0.3393058180809021, 0.46026718616485596, 0.581228494644165, 0.7021898627281189, 0.8231512308120728, 0.9441125988960266, 1.0650739669799805, 1.1860352754592896, 1.3069965839385986, 1.4279580116271973, 1.5489193201065063, 1.6698806285858154, 1.790842056274414, 1.9118033647537231, 2.0327646732330322, 2.153726100921631, 2.2746875286102295, 2.395648956298828, 2.5166101455688477, 2.6375715732574463, 2.758533000946045, 2.8794944286346436, 3.000455617904663, 3.1214170455932617, 3.2423784732818604, 3.363339900970459, 3.4843010902404785, 3.605262517929077, 3.7262237071990967]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 4.0, 8.0, 10.0, 11.0, 9.0, 11.0, 11.0, 18.0, 21.0, 34.0, 22.0, 27.0, 39.0, 33.0, 37.0, 109.0, 212.0, 85.0, 41.0, 27.0, 14.0, 32.0, 15.0, 25.0, 14.0, 21.0, 12.0, 15.0, 12.0, 13.0, 12.0, 3.0, 4.0, 7.0, 9.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.28076171875, -0.2715034484863281, -0.26224517822265625, -0.2529869079589844, -0.2437286376953125, -0.23447036743164062, -0.22521209716796875, -0.21595382690429688, -0.206695556640625, -0.19743728637695312, -0.18817901611328125, -0.17892074584960938, -0.1696624755859375, -0.16040420532226562, -0.15114593505859375, -0.14188766479492188, -0.13262939453125, -0.12337112426757812, -0.11411285400390625, -0.10485458374023438, -0.0955963134765625, -0.08633804321289062, -0.07707977294921875, -0.06782150268554688, -0.058563232421875, -0.049304962158203125, -0.04004669189453125, -0.030788421630859375, -0.0215301513671875, -0.012271881103515625, -0.00301361083984375, 0.006244659423828125, 0.0155029296875, 0.024761199951171875, 0.03401947021484375, 0.043277740478515625, 0.0525360107421875, 0.061794281005859375, 0.07105255126953125, 0.08031082153320312, 0.089569091796875, 0.09882736206054688, 0.10808563232421875, 0.11734390258789062, 0.1266021728515625, 0.13586044311523438, 0.14511871337890625, 0.15437698364257812, 0.16363525390625, 0.17289352416992188, 0.18215179443359375, 0.19141006469726562, 0.2006683349609375, 0.20992660522460938, 0.21918487548828125, 0.22844314575195312, 0.237701416015625, 0.24695968627929688, 0.25621795654296875, 0.2654762268066406, 0.2747344970703125, 0.2839927673339844, 0.29325103759765625, 0.3025093078613281, 0.311767578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 12.0, 15.0, 21.0, 27.0, 70.0, 214.0, 1587.0, 91547.0, 8292478.0, 2144.0, 262.0, 79.0, 56.0, 33.0, 15.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.132739067077637, -7.870877742767334, -7.609016418457031, -7.34715461730957, -7.085293292999268, -6.823431968688965, -6.561570167541504, -6.299708843231201, -6.037847518920898, -5.775986194610596, -5.514124870300293, -5.252263069152832, -4.990401744842529, -4.728540420532227, -4.466678619384766, -4.204817295074463, -3.94295597076416, -3.6810946464538574, -3.4192330837249756, -3.1573715209960938, -2.895510196685791, -2.6336488723754883, -2.3717873096466064, -2.1099257469177246, -1.8480644226074219, -1.5862029790878296, -1.3243415355682373, -1.062480092048645, -0.8006186485290527, -0.5387572050094604, -0.27689576148986816, -0.015034317970275879, 0.2468271255493164, 0.5086885690689087, 0.770550012588501, 1.0324114561080933, 1.2942728996276855, 1.5561343431472778, 1.8179957866668701, 2.079857349395752, 2.3417186737060547, 2.6035799980163574, 2.8654415607452393, 3.127303123474121, 3.389164447784424, 3.6510257720947266, 3.9128873348236084, 4.17474889755249, 4.436610221862793, 4.698471546173096, 4.960332870483398, 5.222194671630859, 5.484055995941162, 5.745917320251465, 6.007779121398926, 6.2696404457092285, 6.531501770019531, 6.793363094329834, 7.055224418640137, 7.317086219787598, 7.5789475440979, 7.840808868408203, 8.102670669555664, 8.364531517028809, 8.62639331817627]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 7.0, 3.0, 7.0, 4.0, 5.0, 7.0, 3.0, 3.0, 6.0, 4.0, 4.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.435853958129883, -6.282285213470459, -6.128715991973877, -5.975147247314453, -5.821578025817871, -5.668009281158447, -5.514440536499023, -5.360871315002441, -5.207302570343018, -5.053733825683594, -4.900164604187012, -4.746595859527588, -4.593026638031006, -4.439457893371582, -4.285888671875, -4.132319927215576, -3.9787509441375732, -3.8251819610595703, -3.6716129779815674, -3.5180439949035645, -3.3644752502441406, -3.2109062671661377, -3.0573372840881348, -2.903768539428711, -2.750199317932129, -2.596630334854126, -2.443061351776123, -2.289492607116699, -2.1359236240386963, -1.9823546409606934, -1.8287856578826904, -1.675216794013977, -1.5216476917266846, -1.3680787086486816, -1.2145098447799683, -1.0609408617019653, -0.9073719382286072, -0.753803014755249, -0.6002340316772461, -0.4466651678085327, -0.2930961847305298, -0.13952724635601044, 0.014041692018508911, 0.16761064529418945, 0.3211795687675476, 0.47474849224090576, 0.6283174753189087, 0.7818863391876221, 0.935455322265625, 1.089024305343628, 1.2425931692123413, 1.3961621522903442, 1.5497310161590576, 1.7032999992370605, 1.8568689823150635, 2.0104379653930664, 2.1640067100524902, 2.317575693130493, 2.471144676208496, 2.62471342086792, 2.778282403945923, 2.931851387023926, 3.0854203701019287, 3.2389893531799316, 3.3925583362579346]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 11.0, 17.0, 15.0, 24.0, 31.0, 60.0, 72.0, 108.0, 164.0, 298.0, 611.0, 2132.0, 10046.0, 60171.0, 295552.0, 129081.0, 19904.0, 3834.0, 1032.0, 447.0, 179.0, 134.0, 96.0, 54.0, 56.0, 28.0, 23.0, 22.0, 16.0, 9.0, 6.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.69921875, -5.5194091796875, -5.339599609375, -5.1597900390625, -4.97998046875, -4.8001708984375, -4.620361328125, -4.4405517578125, -4.2607421875, -4.0809326171875, -3.901123046875, -3.7213134765625, -3.54150390625, -3.3616943359375, -3.181884765625, -3.0020751953125, -2.822265625, -2.6424560546875, -2.462646484375, -2.2828369140625, -2.10302734375, -1.9232177734375, -1.743408203125, -1.5635986328125, -1.3837890625, -1.2039794921875, -1.024169921875, -0.8443603515625, -0.66455078125, -0.4847412109375, -0.304931640625, -0.1251220703125, 0.0546875, 0.2344970703125, 0.414306640625, 0.5941162109375, 0.77392578125, 0.9537353515625, 1.133544921875, 1.3133544921875, 1.4931640625, 1.6729736328125, 1.852783203125, 2.0325927734375, 2.21240234375, 2.3922119140625, 2.572021484375, 2.7518310546875, 2.931640625, 3.1114501953125, 3.291259765625, 3.4710693359375, 3.65087890625, 3.8306884765625, 4.010498046875, 4.1903076171875, 4.3701171875, 4.5499267578125, 4.729736328125, 4.9095458984375, 5.08935546875, 5.2691650390625, 5.448974609375, 5.6287841796875, 5.80859375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 4.0, 10.0, 7.0, 13.0, 12.0, 10.0, 22.0, 20.0, 34.0, 45.0, 45.0, 42.0, 61.0, 74.0, 65.0, 85.0, 63.0, 54.0, 59.0, 45.0, 41.0, 46.0, 31.0, 24.0, 16.0, 14.0, 14.0, 7.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.470458984375, -0.4566993713378906, -0.44293975830078125, -0.4291801452636719, -0.4154205322265625, -0.4016609191894531, -0.38790130615234375, -0.3741416931152344, -0.360382080078125, -0.3466224670410156, -0.33286285400390625, -0.3191032409667969, -0.3053436279296875, -0.2915840148925781, -0.27782440185546875, -0.2640647888183594, -0.25030517578125, -0.23654556274414062, -0.22278594970703125, -0.20902633666992188, -0.1952667236328125, -0.18150711059570312, -0.16774749755859375, -0.15398788452148438, -0.140228271484375, -0.12646865844726562, -0.11270904541015625, -0.09894943237304688, -0.0851898193359375, -0.07143020629882812, -0.05767059326171875, -0.043910980224609375, -0.0301513671875, -0.016391754150390625, -0.00263214111328125, 0.011127471923828125, 0.0248870849609375, 0.038646697998046875, 0.05240631103515625, 0.06616592407226562, 0.079925537109375, 0.09368515014648438, 0.10744476318359375, 0.12120437622070312, 0.1349639892578125, 0.14872360229492188, 0.16248321533203125, 0.17624282836914062, 0.19000244140625, 0.20376205444335938, 0.21752166748046875, 0.23128128051757812, 0.2450408935546875, 0.2588005065917969, 0.27256011962890625, 0.2863197326660156, 0.300079345703125, 0.3138389587402344, 0.32759857177734375, 0.3413581848144531, 0.3551177978515625, 0.3688774108886719, 0.38263702392578125, 0.3963966369628906, 0.41015625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 2.0, 11.0, 10.0, 30.0, 62.0, 91.0, 93.0, 69.0, 46.0, 21.0, 10.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9703562259674072, -2.837705612182617, -2.7050552368164062, -2.5724048614501953, -2.4397542476654053, -2.3071036338806152, -2.1744532585144043, -2.0418028831481934, -1.9091522693634033, -1.7765017747879028, -1.6438512802124023, -1.5112007856369019, -1.3785502910614014, -1.2458997964859009, -1.1132493019104004, -0.9805988073348999, -0.8479483127593994, -0.7152978181838989, -0.5826473236083984, -0.44999682903289795, -0.31734633445739746, -0.18469583988189697, -0.052045345306396484, 0.080605149269104, 0.2132556438446045, 0.345906138420105, 0.47855663299560547, 0.611207127571106, 0.7438576221466064, 0.8765081167221069, 1.0091586112976074, 1.141809105873108, 1.2744593620300293, 1.4071098566055298, 1.5397603511810303, 1.6724108457565308, 1.8050613403320312, 1.9377118349075317, 2.0703623294830322, 2.2030129432678223, 2.335663318634033, 2.468313694000244, 2.600964307785034, 2.733614921569824, 2.866265296936035, 2.998915672302246, 3.131566286087036, 3.264216899871826, 3.396867275238037, 3.529517650604248, 3.662168264389038, 3.794818878173828, 3.927469253540039, 4.06011962890625, 4.192770004272461, 4.32542085647583, 4.458071231842041, 4.590721607208252, 4.723372459411621, 4.856022834777832, 4.988673210144043, 5.121323585510254, 5.253973960876465, 5.386624813079834, 5.519275188446045]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 16.0, 35.0, 68.0, 69.0, 82.0, 61.0, 37.0, 15.0, 12.0, 7.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 4.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7188446521759033, -1.6588523387908936, -1.5988600254058838, -1.5388678312301636, -1.4788755178451538, -1.418883204460144, -1.3588908910751343, -1.298898696899414, -1.2389063835144043, -1.1789140701293945, -1.1189217567443848, -1.0589295625686646, -0.9989372491836548, -0.938944935798645, -0.8789526224136353, -0.8189603686332703, -0.7589680552482605, -0.6989757418632507, -0.6389834880828857, -0.578991174697876, -0.518998920917511, -0.4590066075325012, -0.39901432394981384, -0.33902204036712646, -0.2790297567844391, -0.2190374732017517, -0.15904518961906433, -0.09905289113521576, -0.03906060755252838, 0.02093169093132019, 0.08092397451400757, 0.14091625809669495, 0.20090854167938232, 0.2609008252620697, 0.3208931088447571, 0.38088542222976685, 0.44087767601013184, 0.5008699893951416, 0.5608623027801514, 0.6208545565605164, 0.6808468103408813, 0.7408391237258911, 0.8008313775062561, 0.8608236908912659, 0.9208159446716309, 0.9808082580566406, 1.0408005714416504, 1.1007928848266602, 1.16078519821167, 1.2207775115966797, 1.2807698249816895, 1.3407620191574097, 1.4007543325424194, 1.4607466459274292, 1.520738959312439, 1.5807311534881592, 1.640723466873169, 1.7007157802581787, 1.7607080936431885, 1.8207002878189087, 1.8806926012039185, 1.9406849145889282, 2.0006771087646484, 2.060669422149658, 2.120661735534668]}, "train/train_runtime": 4741.9429, "train/train_samples_per_second": 6.018, "train/train_steps_per_second": 0.063, "train/total_flos": 0.0, "train/train_loss": 4.266032724669485} \ No newline at end of file