diff --git "a/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" "b/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" --- "a/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" +++ "b/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.4907, "train/learning_rate": 3.1914893617021275e-07, "train/epoch": 1.0, "train/global_step": 594, "_runtime": 5718, "_timestamp": 1646079957, "_step": 595, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 10.0, 548.0, 448.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.368497848510742, -13.00784683227539, -8.647195816040039, -4.2865447998046875, 0.07410621643066406, 4.434757232666016, 8.795408248901367, 13.156059265136719, 17.51671028137207, 21.877361297607422, 26.238012313842773, 30.598663330078125, 34.959312438964844, 39.31996536254883, 43.68061828613281, 48.04126739501953, 52.40191650390625, 56.76256561279297, 61.12321853637695, 65.48387145996094, 69.84452056884766, 74.20516967773438, 78.56582641601562, 82.92647552490234, 87.28712463378906, 91.64777374267578, 96.0084228515625, 100.36907958984375, 104.72972869873047, 109.09037780761719, 113.45103454589844, 117.81168365478516, 122.17233276367188, 126.5329818725586, 130.8936309814453, 135.25428771972656, 139.61492919921875, 143.9755859375, 148.33624267578125, 152.69688415527344, 157.0575408935547, 161.41819763183594, 165.77883911132812, 170.13949584960938, 174.50015258789062, 178.8607940673828, 183.22145080566406, 187.58209228515625, 191.9427490234375, 196.30340576171875, 200.66404724121094, 205.0247039794922, 209.38534545898438, 213.74600219726562, 218.10665893554688, 222.46730041503906, 226.8279571533203, 231.18861389160156, 235.54925537109375, 239.909912109375, 244.27056884765625, 248.63121032714844, 252.9918670654297, 257.3525085449219, 261.7131652832031]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 11.0, 7.0, 6.0, 16.0, 13.0, 18.0, 20.0, 23.0, 27.0, 29.0, 25.0, 36.0, 44.0, 38.0, 33.0, 30.0, 39.0, 56.0, 53.0, 59.0, 39.0, 36.0, 41.0, 37.0, 33.0, 35.0, 27.0, 23.0, 28.0, 28.0, 21.0, 13.0, 16.0, 5.0, 5.0, 10.0, 4.0, 2.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.572723388671875, -20.85820770263672, -20.143692016601562, -19.429176330566406, -18.71466064453125, -18.00014305114746, -17.285627365112305, -16.57111167907715, -15.856595993041992, -15.142080307006836, -14.42756462097168, -13.713047981262207, -12.99853229522705, -12.284016609191895, -11.569499969482422, -10.854984283447266, -10.14046859741211, -9.425952911376953, -8.711437225341797, -7.996920585632324, -7.282404899597168, -6.567889213562012, -5.853373050689697, -5.138856887817383, -4.424341201782227, -3.709825277328491, -2.995309352874756, -2.2807934284210205, -1.5662775039672852, -0.8517615795135498, -0.13724565505981445, 0.5772705078125, 1.2917861938476562, 2.0063021183013916, 2.720818042755127, 3.4353339672088623, 4.149849891662598, 4.864365577697754, 5.578881740570068, 6.293397903442383, 7.007913589477539, 7.722429275512695, 8.436944961547852, 9.151461601257324, 9.86597728729248, 10.580492973327637, 11.29500961303711, 12.009525299072266, 12.724040985107422, 13.438556671142578, 14.153072357177734, 14.867588996887207, 15.582104682922363, 16.296621322631836, 17.011137008666992, 17.72565269470215, 18.440168380737305, 19.15468406677246, 19.869199752807617, 20.583715438842773, 21.298233032226562, 22.01274871826172, 22.727264404296875, 23.44178009033203, 24.156295776367188]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 3.0, 8.0, 11.0, 10.0, 16.0, 22.0, 17.0, 19.0, 23.0, 36.0, 22.0, 35.0, 33.0, 30.0, 43.0, 39.0, 48.0, 41.0, 45.0, 49.0, 46.0, 42.0, 34.0, 30.0, 45.0, 35.0, 27.0, 33.0, 26.0, 30.0, 17.0, 16.0, 13.0, 6.0, 9.0, 5.0, 9.0, 10.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1525115966796875, -1.114593505859375, -1.0766754150390625, -1.03875732421875, -1.0008392333984375, -0.962921142578125, -0.9250030517578125, -0.8870849609375, -0.8491668701171875, -0.811248779296875, -0.7733306884765625, -0.73541259765625, -0.6974945068359375, -0.659576416015625, -0.6216583251953125, -0.583740234375, -0.5458221435546875, -0.507904052734375, -0.4699859619140625, -0.43206787109375, -0.3941497802734375, -0.356231689453125, -0.3183135986328125, -0.2803955078125, -0.2424774169921875, -0.204559326171875, -0.1666412353515625, -0.12872314453125, -0.0908050537109375, -0.052886962890625, -0.0149688720703125, 0.02294921875, 0.0608673095703125, 0.098785400390625, 0.1367034912109375, 0.17462158203125, 0.2125396728515625, 0.250457763671875, 0.2883758544921875, 0.3262939453125, 0.3642120361328125, 0.402130126953125, 0.4400482177734375, 0.47796630859375, 0.5158843994140625, 0.553802490234375, 0.5917205810546875, 0.629638671875, 0.6675567626953125, 0.705474853515625, 0.7433929443359375, 0.78131103515625, 0.8192291259765625, 0.857147216796875, 0.8950653076171875, 0.9329833984375, 0.9709014892578125, 1.008819580078125, 1.0467376708984375, 1.08465576171875, 1.1225738525390625, 1.160491943359375, 1.1984100341796875, 1.236328125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 9.0, 9.0, 24.0, 24.0, 33.0, 36.0, 57.0, 95.0, 129.0, 192.0, 308.0, 504.0, 775.0, 1315.0, 2239.0, 4421.0, 11468.0, 39459.0, 231150.0, 2016112.0, 1650216.0, 182969.0, 33397.0, 10070.0, 4090.0, 2023.0, 1151.0, 684.0, 434.0, 304.0, 161.0, 139.0, 71.0, 53.0, 40.0, 27.0, 16.0, 17.0, 9.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.978515625, -3.861297607421875, -3.74407958984375, -3.626861572265625, -3.5096435546875, -3.392425537109375, -3.27520751953125, -3.157989501953125, -3.040771484375, -2.923553466796875, -2.80633544921875, -2.689117431640625, -2.5718994140625, -2.454681396484375, -2.33746337890625, -2.220245361328125, -2.10302734375, -1.985809326171875, -1.86859130859375, -1.751373291015625, -1.6341552734375, -1.516937255859375, -1.39971923828125, -1.282501220703125, -1.165283203125, -1.048065185546875, -0.93084716796875, -0.813629150390625, -0.6964111328125, -0.579193115234375, -0.46197509765625, -0.344757080078125, -0.2275390625, -0.110321044921875, 0.00689697265625, 0.124114990234375, 0.2413330078125, 0.358551025390625, 0.47576904296875, 0.592987060546875, 0.710205078125, 0.827423095703125, 0.94464111328125, 1.061859130859375, 1.1790771484375, 1.296295166015625, 1.41351318359375, 1.530731201171875, 1.64794921875, 1.765167236328125, 1.88238525390625, 1.999603271484375, 2.1168212890625, 2.234039306640625, 2.35125732421875, 2.468475341796875, 2.585693359375, 2.702911376953125, 2.82012939453125, 2.937347412109375, 3.0545654296875, 3.171783447265625, 3.28900146484375, 3.406219482421875, 3.5234375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 20.0, 42.0, 64.0, 79.0, 143.0, 234.0, 413.0, 711.0, 810.0, 625.0, 349.0, 214.0, 124.0, 92.0, 54.0, 22.0, 21.0, 17.0, 11.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.62384033203125, -7.4078369140625, -7.19183349609375, -6.975830078125, -6.75982666015625, -6.5438232421875, -6.32781982421875, -6.11181640625, -5.89581298828125, -5.6798095703125, -5.46380615234375, -5.247802734375, -5.03179931640625, -4.8157958984375, -4.59979248046875, -4.3837890625, -4.16778564453125, -3.9517822265625, -3.73577880859375, -3.519775390625, -3.30377197265625, -3.0877685546875, -2.87176513671875, -2.65576171875, -2.43975830078125, -2.2237548828125, -2.00775146484375, -1.791748046875, -1.57574462890625, -1.3597412109375, -1.14373779296875, -0.927734375, -0.71173095703125, -0.4957275390625, -0.27972412109375, -0.063720703125, 0.15228271484375, 0.3682861328125, 0.58428955078125, 0.80029296875, 1.01629638671875, 1.2322998046875, 1.44830322265625, 1.664306640625, 1.88031005859375, 2.0963134765625, 2.31231689453125, 2.5283203125, 2.74432373046875, 2.9603271484375, 3.17633056640625, 3.392333984375, 3.60833740234375, 3.8243408203125, 4.04034423828125, 4.25634765625, 4.47235107421875, 4.6883544921875, 4.90435791015625, 5.120361328125, 5.33636474609375, 5.5523681640625, 5.76837158203125, 5.984375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 18.0, 21.0, 35.0, 81.0, 168.0, 287.0, 534.0, 1220.0, 3921.0, 70392.0, 4064315.0, 47327.0, 3595.0, 1183.0, 491.0, 299.0, 137.0, 85.0, 63.0, 28.0, 18.0, 7.0, 8.0, 8.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.046875, -22.358154296875, -21.66943359375, -20.980712890625, -20.2919921875, -19.603271484375, -18.91455078125, -18.225830078125, -17.537109375, -16.848388671875, -16.15966796875, -15.470947265625, -14.7822265625, -14.093505859375, -13.40478515625, -12.716064453125, -12.02734375, -11.338623046875, -10.64990234375, -9.961181640625, -9.2724609375, -8.583740234375, -7.89501953125, -7.206298828125, -6.517578125, -5.828857421875, -5.14013671875, -4.451416015625, -3.7626953125, -3.073974609375, -2.38525390625, -1.696533203125, -1.0078125, -0.319091796875, 0.36962890625, 1.058349609375, 1.7470703125, 2.435791015625, 3.12451171875, 3.813232421875, 4.501953125, 5.190673828125, 5.87939453125, 6.568115234375, 7.2568359375, 7.945556640625, 8.63427734375, 9.322998046875, 10.01171875, 10.700439453125, 11.38916015625, 12.077880859375, 12.7666015625, 13.455322265625, 14.14404296875, 14.832763671875, 15.521484375, 16.210205078125, 16.89892578125, 17.587646484375, 18.2763671875, 18.965087890625, 19.65380859375, 20.342529296875, 21.03125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 294.0, 709.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.29066467285156, -224.8906707763672, -220.4906768798828, -216.09068298339844, -211.69068908691406, -207.2906951904297, -202.8907012939453, -198.49069213867188, -194.0906982421875, -189.69070434570312, -185.29071044921875, -180.89071655273438, -176.49072265625, -172.09072875976562, -167.69073486328125, -163.29074096679688, -158.8907470703125, -154.49075317382812, -150.09075927734375, -145.69076538085938, -141.290771484375, -136.89077758789062, -132.49078369140625, -128.09078979492188, -123.69078826904297, -119.2907943725586, -114.89080047607422, -110.49080657958984, -106.09080505371094, -101.69081115722656, -97.29081726074219, -92.89082336425781, -88.49083709716797, -84.0908432006836, -79.69084930419922, -75.29085540771484, -70.89085388183594, -66.49085998535156, -62.09086608886719, -57.69087219238281, -53.29087829589844, -48.89088439941406, -44.49089050292969, -40.09089279174805, -35.69089889526367, -31.290904998779297, -26.89090919494629, -22.49091339111328, -18.090919494628906, -13.690924644470215, -9.290929794311523, -4.890934944152832, -0.4909400939941406, 3.9090538024902344, 8.309049606323242, 12.70904541015625, 17.109039306640625, 21.509033203125, 25.909029006958008, 30.309024810791016, 34.70901870727539, 39.109012603759766, 43.509010314941406, 47.90900421142578, 52.308998107910156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 6.0, 6.0, 14.0, 15.0, 15.0, 26.0, 29.0, 35.0, 34.0, 42.0, 38.0, 39.0, 54.0, 38.0, 63.0, 40.0, 40.0, 52.0, 53.0, 38.0, 40.0, 48.0, 33.0, 21.0, 27.0, 22.0, 18.0, 18.0, 21.0, 11.0, 9.0, 6.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.034442901611328, -19.45001220703125, -18.865581512451172, -18.281150817871094, -17.696720123291016, -17.11229133605957, -16.527860641479492, -15.943429946899414, -15.358999252319336, -14.774568557739258, -14.19013786315918, -13.605708122253418, -13.02127742767334, -12.436846733093262, -11.8524169921875, -11.267986297607422, -10.683555603027344, -10.099124908447266, -9.514694213867188, -8.930264472961426, -8.345833778381348, -7.7614030838012695, -7.17697286605835, -6.59254264831543, -6.008111953735352, -5.423681259155273, -4.8392510414123535, -4.254820823669434, -3.6703901290893555, -3.0859596729278564, -2.5015292167663574, -1.9170989990234375, -1.3326702117919922, -0.7482397556304932, -0.16380929946899414, 0.4206211566925049, 1.005051612854004, 1.589482069015503, 2.173912525177002, 2.758342742919922, 3.3427734375, 3.927203893661499, 4.511634349822998, 5.096064567565918, 5.680495262145996, 6.264925956726074, 6.849356174468994, 7.433786392211914, 8.018217086791992, 8.60264778137207, 9.187078475952148, 9.77150821685791, 10.355938911437988, 10.940369606018066, 11.524799346923828, 12.109230041503906, 12.693660736083984, 13.278091430664062, 13.86252212524414, 14.446951866149902, 15.03138256072998, 15.615813255310059, 16.20024299621582, 16.7846736907959, 17.369104385375977]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 11.0, 5.0, 7.0, 10.0, 11.0, 6.0, 12.0, 18.0, 21.0, 13.0, 23.0, 20.0, 24.0, 29.0, 31.0, 27.0, 27.0, 33.0, 26.0, 34.0, 34.0, 44.0, 45.0, 47.0, 45.0, 32.0, 33.0, 23.0, 33.0, 25.0, 33.0, 25.0, 27.0, 22.0, 18.0, 24.0, 20.0, 11.0, 14.0, 10.0, 10.0, 12.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.032379150390625, -0.99835205078125, -0.964324951171875, -0.9302978515625, -0.896270751953125, -0.86224365234375, -0.828216552734375, -0.794189453125, -0.760162353515625, -0.72613525390625, -0.692108154296875, -0.6580810546875, -0.624053955078125, -0.59002685546875, -0.555999755859375, -0.52197265625, -0.487945556640625, -0.45391845703125, -0.419891357421875, -0.3858642578125, -0.351837158203125, -0.31781005859375, -0.283782958984375, -0.249755859375, -0.215728759765625, -0.18170166015625, -0.147674560546875, -0.1136474609375, -0.079620361328125, -0.04559326171875, -0.011566162109375, 0.0224609375, 0.056488037109375, 0.09051513671875, 0.124542236328125, 0.1585693359375, 0.192596435546875, 0.22662353515625, 0.260650634765625, 0.294677734375, 0.328704833984375, 0.36273193359375, 0.396759033203125, 0.4307861328125, 0.464813232421875, 0.49884033203125, 0.532867431640625, 0.56689453125, 0.600921630859375, 0.63494873046875, 0.668975830078125, 0.7030029296875, 0.737030029296875, 0.77105712890625, 0.805084228515625, 0.839111328125, 0.873138427734375, 0.90716552734375, 0.941192626953125, 0.9752197265625, 1.009246826171875, 1.04327392578125, 1.077301025390625, 1.111328125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 11.0, 24.0, 24.0, 25.0, 50.0, 86.0, 137.0, 213.0, 302.0, 403.0, 732.0, 1084.0, 1653.0, 2619.0, 4081.0, 6619.0, 10496.0, 17099.0, 27926.0, 45922.0, 78847.0, 149047.0, 323990.0, 165198.0, 84497.0, 49332.0, 29557.0, 18126.0, 11362.0, 6977.0, 4440.0, 2777.0, 1726.0, 1103.0, 729.0, 455.0, 319.0, 174.0, 112.0, 90.0, 57.0, 44.0, 21.0, 19.0, 17.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2437744140625, -0.23628807067871094, -0.22880172729492188, -0.2213153839111328, -0.21382904052734375, -0.2063426971435547, -0.19885635375976562, -0.19137001037597656, -0.1838836669921875, -0.17639732360839844, -0.16891098022460938, -0.1614246368408203, -0.15393829345703125, -0.1464519500732422, -0.13896560668945312, -0.13147926330566406, -0.123992919921875, -0.11650657653808594, -0.10902023315429688, -0.10153388977050781, -0.09404754638671875, -0.08656120300292969, -0.07907485961914062, -0.07158851623535156, -0.0641021728515625, -0.05661582946777344, -0.049129486083984375, -0.04164314270019531, -0.03415679931640625, -0.026670455932617188, -0.019184112548828125, -0.011697769165039062, -0.00421142578125, 0.0032749176025390625, 0.010761260986328125, 0.018247604370117188, 0.02573394775390625, 0.03322029113769531, 0.040706634521484375, 0.04819297790527344, 0.0556793212890625, 0.06316566467285156, 0.07065200805664062, 0.07813835144042969, 0.08562469482421875, 0.09311103820800781, 0.10059738159179688, 0.10808372497558594, 0.115570068359375, 0.12305641174316406, 0.13054275512695312, 0.1380290985107422, 0.14551544189453125, 0.1530017852783203, 0.16048812866210938, 0.16797447204589844, 0.1754608154296875, 0.18294715881347656, 0.19043350219726562, 0.1979198455810547, 0.20540618896484375, 0.2128925323486328, 0.22037887573242188, 0.22786521911621094, 0.2353515625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 3.0, 6.0, 6.0, 5.0, 7.0, 8.0, 11.0, 12.0, 16.0, 14.0, 23.0, 32.0, 29.0, 29.0, 26.0, 21.0, 38.0, 31.0, 35.0, 40.0, 44.0, 41.0, 1065.0, 35.0, 35.0, 43.0, 31.0, 38.0, 30.0, 34.0, 22.0, 22.0, 18.0, 29.0, 28.0, 14.0, 13.0, 18.0, 15.0, 10.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.72607421875, -0.703216552734375, -0.68035888671875, -0.657501220703125, -0.6346435546875, -0.611785888671875, -0.58892822265625, -0.566070556640625, -0.543212890625, -0.520355224609375, -0.49749755859375, -0.474639892578125, -0.4517822265625, -0.428924560546875, -0.40606689453125, -0.383209228515625, -0.3603515625, -0.337493896484375, -0.31463623046875, -0.291778564453125, -0.2689208984375, -0.246063232421875, -0.22320556640625, -0.200347900390625, -0.177490234375, -0.154632568359375, -0.13177490234375, -0.108917236328125, -0.0860595703125, -0.063201904296875, -0.04034423828125, -0.017486572265625, 0.00537109375, 0.028228759765625, 0.05108642578125, 0.073944091796875, 0.0968017578125, 0.119659423828125, 0.14251708984375, 0.165374755859375, 0.188232421875, 0.211090087890625, 0.23394775390625, 0.256805419921875, 0.2796630859375, 0.302520751953125, 0.32537841796875, 0.348236083984375, 0.37109375, 0.393951416015625, 0.41680908203125, 0.439666748046875, 0.4625244140625, 0.485382080078125, 0.50823974609375, 0.531097412109375, 0.553955078125, 0.576812744140625, 0.59967041015625, 0.622528076171875, 0.6453857421875, 0.668243408203125, 0.69110107421875, 0.713958740234375, 0.73681640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 12.0, 19.0, 34.0, 51.0, 71.0, 83.0, 133.0, 169.0, 292.0, 432.0, 528.0, 813.0, 1101.0, 1715.0, 2372.0, 3365.0, 5158.0, 7405.0, 10987.0, 16247.0, 24782.0, 39352.0, 63459.0, 112377.0, 1253693.0, 263974.0, 111353.0, 63116.0, 38834.0, 24805.0, 16195.0, 10821.0, 7183.0, 4971.0, 3420.0, 2335.0, 1677.0, 1175.0, 764.0, 542.0, 415.0, 300.0, 191.0, 108.0, 92.0, 73.0, 40.0, 38.0, 20.0, 6.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.194580078125, -0.18849754333496094, -0.18241500854492188, -0.1763324737548828, -0.17024993896484375, -0.1641674041748047, -0.15808486938476562, -0.15200233459472656, -0.1459197998046875, -0.13983726501464844, -0.13375473022460938, -0.1276721954345703, -0.12158966064453125, -0.11550712585449219, -0.10942459106445312, -0.10334205627441406, -0.097259521484375, -0.09117698669433594, -0.08509445190429688, -0.07901191711425781, -0.07292938232421875, -0.06684684753417969, -0.060764312744140625, -0.05468177795410156, -0.0485992431640625, -0.04251670837402344, -0.036434173583984375, -0.030351638793945312, -0.02426910400390625, -0.018186569213867188, -0.012104034423828125, -0.0060214996337890625, 6.103515625e-05, 0.0061435699462890625, 0.012226104736328125, 0.018308639526367188, 0.02439117431640625, 0.030473709106445312, 0.036556243896484375, 0.04263877868652344, 0.0487213134765625, 0.05480384826660156, 0.060886383056640625, 0.06696891784667969, 0.07305145263671875, 0.07913398742675781, 0.08521652221679688, 0.09129905700683594, 0.097381591796875, 0.10346412658691406, 0.10954666137695312, 0.11562919616699219, 0.12171173095703125, 0.1277942657470703, 0.13387680053710938, 0.13995933532714844, 0.1460418701171875, 0.15212440490722656, 0.15820693969726562, 0.1642894744873047, 0.17037200927734375, 0.1764545440673828, 0.18253707885742188, 0.18861961364746094, 0.1947021484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 21.0, 28.0, 35.0, 57.0, 67.0, 86.0, 110.0, 125.0, 110.0, 99.0, 74.0, 56.0, 39.0, 30.0, 12.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021141767501831055, -0.0002034902572631836, -0.00019556283950805664, -0.0001876354217529297, -0.00017970800399780273, -0.00017178058624267578, -0.00016385316848754883, -0.00015592575073242188, -0.00014799833297729492, -0.00014007091522216797, -0.00013214349746704102, -0.00012421607971191406, -0.00011628866195678711, -0.00010836124420166016, -0.0001004338264465332, -9.250640869140625e-05, -8.45789909362793e-05, -7.665157318115234e-05, -6.872415542602539e-05, -6.079673767089844e-05, -5.2869319915771484e-05, -4.494190216064453e-05, -3.701448440551758e-05, -2.9087066650390625e-05, -2.1159648895263672e-05, -1.3232231140136719e-05, -5.304813385009766e-06, 2.6226043701171875e-06, 1.055002212524414e-05, 1.8477439880371094e-05, 2.6404857635498047e-05, 3.4332275390625e-05, 4.225969314575195e-05, 5.0187110900878906e-05, 5.811452865600586e-05, 6.604194641113281e-05, 7.396936416625977e-05, 8.189678192138672e-05, 8.982419967651367e-05, 9.775161743164062e-05, 0.00010567903518676758, 0.00011360645294189453, 0.00012153387069702148, 0.00012946128845214844, 0.0001373887062072754, 0.00014531612396240234, 0.0001532435417175293, 0.00016117095947265625, 0.0001690983772277832, 0.00017702579498291016, 0.0001849532127380371, 0.00019288063049316406, 0.00020080804824829102, 0.00020873546600341797, 0.00021666288375854492, 0.00022459030151367188, 0.00023251771926879883, 0.00024044513702392578, 0.00024837255477905273, 0.0002562999725341797, 0.00026422739028930664, 0.0002721548080444336, 0.00028008222579956055, 0.0002880096435546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 8.0, 9.0, 11.0, 16.0, 31.0, 39.0, 73.0, 113.0, 195.0, 287.0, 619.0, 2068.0, 1042181.0, 1615.0, 552.0, 292.0, 177.0, 100.0, 71.0, 37.0, 16.0, 21.0, 13.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004764556884765625, -0.0046176910400390625, -0.0044708251953125, -0.0043239593505859375, -0.004177093505859375, -0.0040302276611328125, -0.00388336181640625, -0.0037364959716796875, -0.003589630126953125, -0.0034427642822265625, -0.0032958984375, -0.0031490325927734375, -0.003002166748046875, -0.0028553009033203125, -0.00270843505859375, -0.0025615692138671875, -0.002414703369140625, -0.0022678375244140625, -0.0021209716796875, -0.0019741058349609375, -0.001827239990234375, -0.0016803741455078125, -0.00153350830078125, -0.0013866424560546875, -0.001239776611328125, -0.0010929107666015625, -0.000946044921875, -0.0007991790771484375, -0.000652313232421875, -0.0005054473876953125, -0.00035858154296875, -0.0002117156982421875, -6.4849853515625e-05, 8.20159912109375e-05, 0.0002288818359375, 0.0003757476806640625, 0.000522613525390625, 0.0006694793701171875, 0.00081634521484375, 0.0009632110595703125, 0.001110076904296875, 0.0012569427490234375, 0.00140380859375, 0.0015506744384765625, 0.001697540283203125, 0.0018444061279296875, 0.00199127197265625, 0.0021381378173828125, 0.002285003662109375, 0.0024318695068359375, 0.0025787353515625, 0.0027256011962890625, 0.002872467041015625, 0.0030193328857421875, 0.00316619873046875, 0.0033130645751953125, 0.003459930419921875, 0.0036067962646484375, 0.003753662109375, 0.0039005279541015625, 0.004047393798828125, 0.0041942596435546875, 0.00434112548828125, 0.0044879913330078125, 0.004634857177734375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 16.0, 303.0, 585.0, 105.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00050628453027457, -0.0004960133810527623, -0.000485742260934785, -0.0004754711117129773, -0.00046519996249116957, -0.0004549288423731923, -0.0004446576931513846, -0.0004343865439295769, -0.00042411539470776916, -0.00041384424548596144, -0.0004035731253679842, -0.00039330197614617646, -0.00038303082692436874, -0.0003727597068063915, -0.00036248855758458376, -0.00035221740836277604, -0.0003419462882447988, -0.00033167513902299106, -0.0003214040189050138, -0.0003111328696832061, -0.00030086172046139836, -0.00029059057123959064, -0.0002803194511216134, -0.00027004830189980567, -0.0002597771817818284, -0.0002495060325600207, -0.0002392348978901282, -0.0002289637632202357, -0.000218692613998428, -0.0002084214793285355, -0.000198150344658643, -0.0001878791954368353, -0.00017760807531885803, -0.00016733694064896554, -0.00015706579142715782, -0.00014679465675726533, -0.0001365235075354576, -0.00012625237286556512, -0.00011598123819567263, -0.00010571009624982253, -9.543895430397242e-05, -8.516781235812232e-05, -7.489667041227221e-05, -6.462553574237972e-05, -5.435439379652962e-05, -4.408325185067952e-05, -3.381211718078703e-05, -2.3540975234936923e-05, -1.3269833289086819e-05, -2.998693162226118e-06, 7.272446964634582e-06, 1.754358527250588e-05, 2.7814727218355983e-05, 3.808586916420609e-05, 4.835700383409858e-05, 5.862814577994868e-05, 6.889928772579879e-05, 7.917042967164889e-05, 8.9441571617499e-05, 9.971270628739148e-05, 0.00010998384823324159, 0.00012025499017909169, 0.00013052612484898418, 0.00014079725951887667, 0.0001510684087406844]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 9.0, 8.0, 13.0, 19.0, 21.0, 16.0, 18.0, 19.0, 29.0, 37.0, 24.0, 35.0, 30.0, 53.0, 46.0, 35.0, 43.0, 42.0, 33.0, 40.0, 47.0, 52.0, 35.0, 40.0, 26.0, 26.0, 35.0, 30.0, 25.0, 21.0, 18.0, 12.0, 12.0, 7.0, 6.0, 11.0, 4.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.325410842895508e-05, -7.086247205734253e-05, -6.847083568572998e-05, -6.607919931411743e-05, -6.368756294250488e-05, -6.129592657089233e-05, -5.8904290199279785e-05, -5.6512653827667236e-05, -5.412101745605469e-05, -5.172938108444214e-05, -4.933774471282959e-05, -4.694610834121704e-05, -4.455447196960449e-05, -4.216283559799194e-05, -3.9771199226379395e-05, -3.7379562854766846e-05, -3.49879264831543e-05, -3.259629011154175e-05, -3.02046537399292e-05, -2.781301736831665e-05, -2.54213809967041e-05, -2.3029744625091553e-05, -2.0638108253479004e-05, -1.8246471881866455e-05, -1.5854835510253906e-05, -1.3463199138641357e-05, -1.1071562767028809e-05, -8.67992639541626e-06, -6.288290023803711e-06, -3.896653652191162e-06, -1.5050172805786133e-06, 8.866190910339355e-07, 3.2782554626464844e-06, 5.669891834259033e-06, 8.061528205871582e-06, 1.0453164577484131e-05, 1.284480094909668e-05, 1.5236437320709229e-05, 1.7628073692321777e-05, 2.0019710063934326e-05, 2.2411346435546875e-05, 2.4802982807159424e-05, 2.7194619178771973e-05, 2.958625555038452e-05, 3.197789192199707e-05, 3.436952829360962e-05, 3.676116466522217e-05, 3.915280103683472e-05, 4.1544437408447266e-05, 4.3936073780059814e-05, 4.632771015167236e-05, 4.871934652328491e-05, 5.111098289489746e-05, 5.350261926651001e-05, 5.589425563812256e-05, 5.828589200973511e-05, 6.0677528381347656e-05, 6.30691647529602e-05, 6.546080112457275e-05, 6.78524374961853e-05, 7.024407386779785e-05, 7.26357102394104e-05, 7.502734661102295e-05, 7.74189829826355e-05, 7.981061935424805e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 11.0, 5.0, 7.0, 10.0, 11.0, 6.0, 12.0, 18.0, 21.0, 13.0, 23.0, 20.0, 24.0, 29.0, 31.0, 27.0, 27.0, 33.0, 26.0, 34.0, 34.0, 44.0, 45.0, 47.0, 45.0, 32.0, 33.0, 23.0, 33.0, 25.0, 33.0, 25.0, 27.0, 22.0, 18.0, 24.0, 20.0, 11.0, 14.0, 10.0, 10.0, 12.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.032379150390625, -0.99835205078125, -0.964324951171875, -0.9302978515625, -0.896270751953125, -0.86224365234375, -0.828216552734375, -0.794189453125, -0.760162353515625, -0.72613525390625, -0.692108154296875, -0.6580810546875, -0.624053955078125, -0.59002685546875, -0.555999755859375, -0.52197265625, -0.487945556640625, -0.45391845703125, -0.419891357421875, -0.3858642578125, -0.351837158203125, -0.31781005859375, -0.283782958984375, -0.249755859375, -0.215728759765625, -0.18170166015625, -0.147674560546875, -0.1136474609375, -0.079620361328125, -0.04559326171875, -0.011566162109375, 0.0224609375, 0.056488037109375, 0.09051513671875, 0.124542236328125, 0.1585693359375, 0.192596435546875, 0.22662353515625, 0.260650634765625, 0.294677734375, 0.328704833984375, 0.36273193359375, 0.396759033203125, 0.4307861328125, 0.464813232421875, 0.49884033203125, 0.532867431640625, 0.56689453125, 0.600921630859375, 0.63494873046875, 0.668975830078125, 0.7030029296875, 0.737030029296875, 0.77105712890625, 0.805084228515625, 0.839111328125, 0.873138427734375, 0.90716552734375, 0.941192626953125, 0.9752197265625, 1.009246826171875, 1.04327392578125, 1.077301025390625, 1.111328125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 4.0, 9.0, 11.0, 21.0, 27.0, 37.0, 45.0, 73.0, 88.0, 110.0, 171.0, 270.0, 334.0, 519.0, 719.0, 1083.0, 1663.0, 2503.0, 4059.0, 7399.0, 17489.0, 70645.0, 506436.0, 354813.0, 48849.0, 14066.0, 6385.0, 3654.0, 2283.0, 1491.0, 957.0, 718.0, 507.0, 319.0, 196.0, 162.0, 125.0, 80.0, 74.0, 47.0, 29.0, 20.0, 13.0, 11.0, 10.0, 10.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.953125, -4.79278564453125, -4.6324462890625, -4.47210693359375, -4.311767578125, -4.15142822265625, -3.9910888671875, -3.83074951171875, -3.67041015625, -3.51007080078125, -3.3497314453125, -3.18939208984375, -3.029052734375, -2.86871337890625, -2.7083740234375, -2.54803466796875, -2.3876953125, -2.22735595703125, -2.0670166015625, -1.90667724609375, -1.746337890625, -1.58599853515625, -1.4256591796875, -1.26531982421875, -1.10498046875, -0.94464111328125, -0.7843017578125, -0.62396240234375, -0.463623046875, -0.30328369140625, -0.1429443359375, 0.01739501953125, 0.177734375, 0.33807373046875, 0.4984130859375, 0.65875244140625, 0.819091796875, 0.97943115234375, 1.1397705078125, 1.30010986328125, 1.46044921875, 1.62078857421875, 1.7811279296875, 1.94146728515625, 2.101806640625, 2.26214599609375, 2.4224853515625, 2.58282470703125, 2.7431640625, 2.90350341796875, 3.0638427734375, 3.22418212890625, 3.384521484375, 3.54486083984375, 3.7052001953125, 3.86553955078125, 4.02587890625, 4.18621826171875, 4.3465576171875, 4.50689697265625, 4.667236328125, 4.82757568359375, 4.9879150390625, 5.14825439453125, 5.30859375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 2.0, 3.0, 4.0, 11.0, 7.0, 8.0, 15.0, 13.0, 16.0, 18.0, 19.0, 20.0, 26.0, 18.0, 28.0, 24.0, 47.0, 38.0, 41.0, 68.0, 104.0, 239.0, 1374.0, 266.0, 128.0, 80.0, 39.0, 46.0, 37.0, 51.0, 27.0, 24.0, 31.0, 30.0, 29.0, 19.0, 13.0, 18.0, 15.0, 13.0, 9.0, 8.0, 3.0, 0.0, 6.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.6875, -3.580596923828125, -3.47369384765625, -3.366790771484375, -3.2598876953125, -3.152984619140625, -3.04608154296875, -2.939178466796875, -2.832275390625, -2.725372314453125, -2.61846923828125, -2.511566162109375, -2.4046630859375, -2.297760009765625, -2.19085693359375, -2.083953857421875, -1.97705078125, -1.870147705078125, -1.76324462890625, -1.656341552734375, -1.5494384765625, -1.442535400390625, -1.33563232421875, -1.228729248046875, -1.121826171875, -1.014923095703125, -0.90802001953125, -0.801116943359375, -0.6942138671875, -0.587310791015625, -0.48040771484375, -0.373504638671875, -0.2666015625, -0.159698486328125, -0.05279541015625, 0.054107666015625, 0.1610107421875, 0.267913818359375, 0.37481689453125, 0.481719970703125, 0.588623046875, 0.695526123046875, 0.80242919921875, 0.909332275390625, 1.0162353515625, 1.123138427734375, 1.23004150390625, 1.336944580078125, 1.44384765625, 1.550750732421875, 1.65765380859375, 1.764556884765625, 1.8714599609375, 1.978363037109375, 2.08526611328125, 2.192169189453125, 2.299072265625, 2.405975341796875, 2.51287841796875, 2.619781494140625, 2.7266845703125, 2.833587646484375, 2.94049072265625, 3.047393798828125, 3.154296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 8.0, 12.0, 11.0, 13.0, 18.0, 26.0, 18.0, 34.0, 35.0, 39.0, 59.0, 87.0, 118.0, 233.0, 451.0, 1447.0, 31931.0, 3073544.0, 35047.0, 1408.0, 469.0, 224.0, 127.0, 66.0, 54.0, 28.0, 27.0, 27.0, 20.0, 26.0, 14.0, 10.0, 8.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 8.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.515625, -12.07666015625, -11.6376953125, -11.19873046875, -10.759765625, -10.32080078125, -9.8818359375, -9.44287109375, -9.00390625, -8.56494140625, -8.1259765625, -7.68701171875, -7.248046875, -6.80908203125, -6.3701171875, -5.93115234375, -5.4921875, -5.05322265625, -4.6142578125, -4.17529296875, -3.736328125, -3.29736328125, -2.8583984375, -2.41943359375, -1.98046875, -1.54150390625, -1.1025390625, -0.66357421875, -0.224609375, 0.21435546875, 0.6533203125, 1.09228515625, 1.53125, 1.97021484375, 2.4091796875, 2.84814453125, 3.287109375, 3.72607421875, 4.1650390625, 4.60400390625, 5.04296875, 5.48193359375, 5.9208984375, 6.35986328125, 6.798828125, 7.23779296875, 7.6767578125, 8.11572265625, 8.5546875, 8.99365234375, 9.4326171875, 9.87158203125, 10.310546875, 10.74951171875, 11.1884765625, 11.62744140625, 12.06640625, 12.50537109375, 12.9443359375, 13.38330078125, 13.822265625, 14.26123046875, 14.7001953125, 15.13916015625, 15.578125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 960.0, 56.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.90650177001953, -50.222145080566406, -44.53778839111328, -38.853431701660156, -33.16907501220703, -27.48472023010254, -21.800365447998047, -16.116008758544922, -10.431652069091797, -4.74729585647583, 0.9370603561401367, 6.621416091918945, 12.30577278137207, 17.990129470825195, 23.674484252929688, 29.358840942382812, 35.04319763183594, 40.72755432128906, 46.41191101074219, 52.09626770019531, 57.78062438964844, 63.46498107910156, 69.14933776855469, 74.83369445800781, 80.51805114746094, 86.20240783691406, 91.88676452636719, 97.57112121582031, 103.25547790527344, 108.93983459472656, 114.62419128417969, 120.30854797363281, 125.99290466308594, 131.67726135253906, 137.3616180419922, 143.0459747314453, 148.73033142089844, 154.41468811035156, 160.0990447998047, 165.7834014892578, 171.46775817871094, 177.15211486816406, 182.8364715576172, 188.5208282470703, 194.20518493652344, 199.88954162597656, 205.5738983154297, 211.2582550048828, 216.94259643554688, 222.626953125, 228.31130981445312, 233.99566650390625, 239.68002319335938, 245.3643798828125, 251.04873657226562, 256.73309326171875, 262.4174499511719, 268.101806640625, 273.7861633300781, 279.47052001953125, 285.1548767089844, 290.8392333984375, 296.5235900878906, 302.20794677734375, 307.8923034667969]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 9.0, 3.0, 4.0, 16.0, 16.0, 9.0, 23.0, 25.0, 15.0, 32.0, 31.0, 39.0, 36.0, 38.0, 23.0, 49.0, 56.0, 42.0, 45.0, 47.0, 28.0, 32.0, 42.0, 41.0, 33.0, 35.0, 29.0, 22.0, 25.0, 11.0, 23.0, 18.0, 8.0, 24.0, 13.0, 8.0, 13.0, 2.0, 5.0, 8.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.243245124816895, -10.839468955993652, -10.43569278717041, -10.031916618347168, -9.628141403198242, -9.224365234375, -8.820589065551758, -8.416812896728516, -8.013036727905273, -7.609260559082031, -7.205484390258789, -6.801708698272705, -6.397932529449463, -5.994156360626221, -5.590380668640137, -5.1866044998168945, -4.782828330993652, -4.37905216217041, -3.975276231765747, -3.571500301361084, -3.167724132537842, -2.7639479637145996, -2.3601720333099365, -1.9563961029052734, -1.5526199340820312, -1.1488438844680786, -0.745067834854126, -0.34129178524017334, 0.0624842643737793, 0.4662604331970215, 0.8700363636016846, 1.2738122940063477, 1.6775875091552734, 2.0813636779785156, 2.4851396083831787, 2.888915538787842, 3.292691707611084, 3.696467876434326, 4.10024356842041, 4.504019737243652, 4.9077959060668945, 5.311572074890137, 5.715348243713379, 6.119123935699463, 6.522900104522705, 6.926676273345947, 7.330451965332031, 7.734228134155273, 8.138004302978516, 8.541780471801758, 8.945556640625, 9.349332809448242, 9.753108978271484, 10.156885147094727, 10.560660362243652, 10.964436531066895, 11.368212699890137, 11.771988868713379, 12.175765037536621, 12.579541206359863, 12.983316421508789, 13.387092590332031, 13.790868759155273, 14.194644927978516, 14.598421096801758]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 15.0, 6.0, 12.0, 14.0, 8.0, 18.0, 16.0, 19.0, 20.0, 26.0, 32.0, 22.0, 24.0, 29.0, 27.0, 25.0, 24.0, 41.0, 44.0, 48.0, 39.0, 45.0, 34.0, 43.0, 26.0, 28.0, 34.0, 26.0, 29.0, 22.0, 30.0, 30.0, 21.0, 18.0, 9.0, 14.0, 15.0, 20.0, 10.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.2529296875, -1.21636962890625, -1.1798095703125, -1.14324951171875, -1.106689453125, -1.07012939453125, -1.0335693359375, -0.99700927734375, -0.96044921875, -0.92388916015625, -0.8873291015625, -0.85076904296875, -0.814208984375, -0.77764892578125, -0.7410888671875, -0.70452880859375, -0.66796875, -0.63140869140625, -0.5948486328125, -0.55828857421875, -0.521728515625, -0.48516845703125, -0.4486083984375, -0.41204833984375, -0.37548828125, -0.33892822265625, -0.3023681640625, -0.26580810546875, -0.229248046875, -0.19268798828125, -0.1561279296875, -0.11956787109375, -0.0830078125, -0.04644775390625, -0.0098876953125, 0.02667236328125, 0.063232421875, 0.09979248046875, 0.1363525390625, 0.17291259765625, 0.20947265625, 0.24603271484375, 0.2825927734375, 0.31915283203125, 0.355712890625, 0.39227294921875, 0.4288330078125, 0.46539306640625, 0.501953125, 0.53851318359375, 0.5750732421875, 0.61163330078125, 0.648193359375, 0.68475341796875, 0.7213134765625, 0.75787353515625, 0.79443359375, 0.83099365234375, 0.8675537109375, 0.90411376953125, 0.940673828125, 0.97723388671875, 1.0137939453125, 1.05035400390625, 1.0869140625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 24.0, 30.0, 36.0, 52.0, 57.0, 83.0, 103.0, 152.0, 242.0, 359.0, 511.0, 827.0, 1439.0, 2827.0, 6366.0, 17360.0, 66136.0, 514416.0, 2859697.0, 617148.0, 73559.0, 18923.0, 6806.0, 3008.0, 1502.0, 908.0, 507.0, 353.0, 229.0, 174.0, 109.0, 74.0, 63.0, 42.0, 35.0, 24.0, 12.0, 17.0, 11.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.0390625, -4.8887939453125, -4.738525390625, -4.5882568359375, -4.43798828125, -4.2877197265625, -4.137451171875, -3.9871826171875, -3.8369140625, -3.6866455078125, -3.536376953125, -3.3861083984375, -3.23583984375, -3.0855712890625, -2.935302734375, -2.7850341796875, -2.634765625, -2.4844970703125, -2.334228515625, -2.1839599609375, -2.03369140625, -1.8834228515625, -1.733154296875, -1.5828857421875, -1.4326171875, -1.2823486328125, -1.132080078125, -0.9818115234375, -0.83154296875, -0.6812744140625, -0.531005859375, -0.3807373046875, -0.23046875, -0.0802001953125, 0.070068359375, 0.2203369140625, 0.37060546875, 0.5208740234375, 0.671142578125, 0.8214111328125, 0.9716796875, 1.1219482421875, 1.272216796875, 1.4224853515625, 1.57275390625, 1.7230224609375, 1.873291015625, 2.0235595703125, 2.173828125, 2.3240966796875, 2.474365234375, 2.6246337890625, 2.77490234375, 2.9251708984375, 3.075439453125, 3.2257080078125, 3.3759765625, 3.5262451171875, 3.676513671875, 3.8267822265625, 3.97705078125, 4.1273193359375, 4.277587890625, 4.4278564453125, 4.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 10.0, 3.0, 18.0, 17.0, 46.0, 78.0, 125.0, 169.0, 311.0, 493.0, 590.0, 711.0, 511.0, 339.0, 231.0, 157.0, 112.0, 64.0, 33.0, 21.0, 22.0, 6.0, 4.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.86236572265625, -8.6466064453125, -8.43084716796875, -8.215087890625, -7.99932861328125, -7.7835693359375, -7.56781005859375, -7.35205078125, -7.13629150390625, -6.9205322265625, -6.70477294921875, -6.489013671875, -6.27325439453125, -6.0574951171875, -5.84173583984375, -5.6259765625, -5.41021728515625, -5.1944580078125, -4.97869873046875, -4.762939453125, -4.54718017578125, -4.3314208984375, -4.11566162109375, -3.89990234375, -3.68414306640625, -3.4683837890625, -3.25262451171875, -3.036865234375, -2.82110595703125, -2.6053466796875, -2.38958740234375, -2.173828125, -1.95806884765625, -1.7423095703125, -1.52655029296875, -1.310791015625, -1.09503173828125, -0.8792724609375, -0.66351318359375, -0.44775390625, -0.23199462890625, -0.0162353515625, 0.19952392578125, 0.415283203125, 0.63104248046875, 0.8468017578125, 1.06256103515625, 1.2783203125, 1.49407958984375, 1.7098388671875, 1.92559814453125, 2.141357421875, 2.35711669921875, 2.5728759765625, 2.78863525390625, 3.00439453125, 3.22015380859375, 3.4359130859375, 3.65167236328125, 3.867431640625, 4.08319091796875, 4.2989501953125, 4.51470947265625, 4.73046875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [5.0, 4.0, 12.0, 13.0, 10.0, 25.0, 56.0, 73.0, 113.0, 192.0, 535.0, 2456.0, 449861.0, 3734267.0, 5573.0, 676.0, 218.0, 99.0, 53.0, 19.0, 20.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5625, -10.68359375, -9.8046875, -8.92578125, -8.046875, -7.16796875, -6.2890625, -5.41015625, -4.53125, -3.65234375, -2.7734375, -1.89453125, -1.015625, -0.13671875, 0.7421875, 1.62109375, 2.5, 3.37890625, 4.2578125, 5.13671875, 6.015625, 6.89453125, 7.7734375, 8.65234375, 9.53125, 10.41015625, 11.2890625, 12.16796875, 13.046875, 13.92578125, 14.8046875, 15.68359375, 16.5625, 17.44140625, 18.3203125, 19.19921875, 20.078125, 20.95703125, 21.8359375, 22.71484375, 23.59375, 24.47265625, 25.3515625, 26.23046875, 27.109375, 27.98828125, 28.8671875, 29.74609375, 30.625, 31.50390625, 32.3828125, 33.26171875, 34.140625, 35.01953125, 35.8984375, 36.77734375, 37.65625, 38.53515625, 39.4140625, 40.29296875, 41.171875, 42.05078125, 42.9296875, 43.80859375, 44.6875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 770.0, 245.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.78044128417969, -51.89575958251953, -46.01108169555664, -40.12640380859375, -34.241722106933594, -28.35704231262207, -22.472362518310547, -16.587684631347656, -10.7030029296875, -4.818323135375977, 1.0663566589355469, 6.95103645324707, 12.835716247558594, 18.720396041870117, 24.60507583618164, 30.48975372314453, 36.37443542480469, 42.259117126464844, 48.143795013427734, 54.028472900390625, 59.91315460205078, 65.79783630371094, 71.68251037597656, 77.56719207763672, 83.45187377929688, 89.33655548095703, 95.22123718261719, 101.10591125488281, 106.99059295654297, 112.87527465820312, 118.75994873046875, 124.6446304321289, 130.529296875, 136.41397094726562, 142.2986602783203, 148.18333435058594, 154.06802368164062, 159.95269775390625, 165.83737182617188, 171.7220458984375, 177.6067352294922, 183.4914093017578, 189.3760986328125, 195.26077270507812, 201.14544677734375, 207.03013610839844, 212.91481018066406, 218.79949951171875, 224.68417358398438, 230.56884765625, 236.4535369873047, 242.3382110595703, 248.222900390625, 254.10757446289062, 259.99224853515625, 265.8769226074219, 271.7615966796875, 277.6462707519531, 283.53094482421875, 289.4156494140625, 295.3003234863281, 301.18499755859375, 307.0696716308594, 312.954345703125, 318.83905029296875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 7.0, 16.0, 8.0, 15.0, 19.0, 24.0, 19.0, 23.0, 30.0, 34.0, 32.0, 36.0, 44.0, 37.0, 35.0, 48.0, 48.0, 43.0, 51.0, 43.0, 48.0, 50.0, 34.0, 39.0, 32.0, 29.0, 35.0, 20.0, 10.0, 19.0, 13.0, 9.0, 9.0, 8.0, 8.0, 7.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.02631378173828, -22.363508224487305, -21.700700759887695, -21.03789520263672, -20.37508773803711, -19.712282180786133, -19.049474716186523, -18.386669158935547, -17.723861694335938, -17.06105613708496, -16.39824867248535, -15.735442161560059, -15.072635650634766, -14.409830093383789, -13.747023582458496, -13.084217071533203, -12.421411514282227, -11.758605003356934, -11.09579849243164, -10.432991981506348, -9.770185470581055, -9.107379913330078, -8.444573402404785, -7.781766891479492, -7.118960380554199, -6.456153869628906, -5.793347358703613, -5.1305413246154785, -4.4677348136901855, -3.8049283027648926, -3.1421220302581787, -2.479315757751465, -1.8165092468261719, -1.1537028551101685, -0.49089646339416504, 0.17190992832183838, 0.8347163200378418, 1.4975228309631348, 2.1603291034698486, 2.8231353759765625, 3.4859418869018555, 4.148748397827148, 4.811554908752441, 5.474360942840576, 6.137167453765869, 6.799973964691162, 7.462779998779297, 8.12558650970459, 8.788393020629883, 9.451199531555176, 10.114006042480469, 10.776812553405762, 11.439619064331055, 12.102424621582031, 12.765231132507324, 13.428037643432617, 14.09084415435791, 14.753650665283203, 15.416457176208496, 16.07926368713379, 16.742069244384766, 17.404876708984375, 18.06768226623535, 18.730487823486328, 19.393295288085938]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 9.0, 8.0, 15.0, 19.0, 15.0, 26.0, 24.0, 29.0, 25.0, 26.0, 24.0, 31.0, 39.0, 38.0, 33.0, 36.0, 37.0, 43.0, 47.0, 37.0, 36.0, 32.0, 37.0, 38.0, 29.0, 24.0, 29.0, 26.0, 19.0, 25.0, 24.0, 26.0, 10.0, 11.0, 7.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.3779296875, -1.339202880859375, -1.30047607421875, -1.261749267578125, -1.2230224609375, -1.184295654296875, -1.14556884765625, -1.106842041015625, -1.068115234375, -1.029388427734375, -0.99066162109375, -0.951934814453125, -0.9132080078125, -0.874481201171875, -0.83575439453125, -0.797027587890625, -0.75830078125, -0.719573974609375, -0.68084716796875, -0.642120361328125, -0.6033935546875, -0.564666748046875, -0.52593994140625, -0.487213134765625, -0.448486328125, -0.409759521484375, -0.37103271484375, -0.332305908203125, -0.2935791015625, -0.254852294921875, -0.21612548828125, -0.177398681640625, -0.138671875, -0.099945068359375, -0.06121826171875, -0.022491455078125, 0.0162353515625, 0.054962158203125, 0.09368896484375, 0.132415771484375, 0.171142578125, 0.209869384765625, 0.24859619140625, 0.287322998046875, 0.3260498046875, 0.364776611328125, 0.40350341796875, 0.442230224609375, 0.48095703125, 0.519683837890625, 0.55841064453125, 0.597137451171875, 0.6358642578125, 0.674591064453125, 0.71331787109375, 0.752044677734375, 0.790771484375, 0.829498291015625, 0.86822509765625, 0.906951904296875, 0.9456787109375, 0.984405517578125, 1.02313232421875, 1.061859130859375, 1.1005859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 12.0, 17.0, 24.0, 24.0, 39.0, 52.0, 80.0, 112.0, 193.0, 282.0, 465.0, 691.0, 1142.0, 1924.0, 3093.0, 5257.0, 8927.0, 15091.0, 25303.0, 42881.0, 74932.0, 145783.0, 314831.0, 189454.0, 91957.0, 51160.0, 30220.0, 18036.0, 10646.0, 6194.0, 3791.0, 2289.0, 1371.0, 814.0, 464.0, 333.0, 219.0, 155.0, 98.0, 73.0, 44.0, 28.0, 20.0, 10.0, 9.0, 5.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0], "bins": [-0.28564453125, -0.27740478515625, -0.2691650390625, -0.26092529296875, -0.252685546875, -0.24444580078125, -0.2362060546875, -0.22796630859375, -0.2197265625, -0.21148681640625, -0.2032470703125, -0.19500732421875, -0.186767578125, -0.17852783203125, -0.1702880859375, -0.16204833984375, -0.15380859375, -0.14556884765625, -0.1373291015625, -0.12908935546875, -0.120849609375, -0.11260986328125, -0.1043701171875, -0.09613037109375, -0.087890625, -0.07965087890625, -0.0714111328125, -0.06317138671875, -0.054931640625, -0.04669189453125, -0.0384521484375, -0.03021240234375, -0.02197265625, -0.01373291015625, -0.0054931640625, 0.00274658203125, 0.010986328125, 0.01922607421875, 0.0274658203125, 0.03570556640625, 0.0439453125, 0.05218505859375, 0.0604248046875, 0.06866455078125, 0.076904296875, 0.08514404296875, 0.0933837890625, 0.10162353515625, 0.10986328125, 0.11810302734375, 0.1263427734375, 0.13458251953125, 0.142822265625, 0.15106201171875, 0.1593017578125, 0.16754150390625, 0.17578125, 0.18402099609375, 0.1922607421875, 0.20050048828125, 0.208740234375, 0.21697998046875, 0.2252197265625, 0.23345947265625, 0.24169921875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 12.0, 12.0, 14.0, 22.0, 12.0, 22.0, 22.0, 33.0, 31.0, 35.0, 44.0, 35.0, 43.0, 38.0, 46.0, 46.0, 1063.0, 47.0, 40.0, 48.0, 38.0, 36.0, 38.0, 24.0, 21.0, 31.0, 33.0, 24.0, 23.0, 13.0, 18.0, 7.0, 8.0, 7.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.830078125, -0.8025436401367188, -0.7750091552734375, -0.7474746704101562, -0.719940185546875, -0.6924057006835938, -0.6648712158203125, -0.6373367309570312, -0.60980224609375, -0.5822677612304688, -0.5547332763671875, -0.5271987915039062, -0.499664306640625, -0.47212982177734375, -0.4445953369140625, -0.41706085205078125, -0.3895263671875, -0.36199188232421875, -0.3344573974609375, -0.30692291259765625, -0.279388427734375, -0.25185394287109375, -0.2243194580078125, -0.19678497314453125, -0.16925048828125, -0.14171600341796875, -0.1141815185546875, -0.08664703369140625, -0.059112548828125, -0.03157806396484375, -0.0040435791015625, 0.02349090576171875, 0.051025390625, 0.07855987548828125, 0.1060943603515625, 0.13362884521484375, 0.161163330078125, 0.18869781494140625, 0.2162322998046875, 0.24376678466796875, 0.27130126953125, 0.29883575439453125, 0.3263702392578125, 0.35390472412109375, 0.381439208984375, 0.40897369384765625, 0.4365081787109375, 0.46404266357421875, 0.4915771484375, 0.5191116333007812, 0.5466461181640625, 0.5741806030273438, 0.601715087890625, 0.6292495727539062, 0.6567840576171875, 0.6843185424804688, 0.71185302734375, 0.7393875122070312, 0.7669219970703125, 0.7944564819335938, 0.821990966796875, 0.8495254516601562, 0.8770599365234375, 0.9045944213867188, 0.93212890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 10.0, 12.0, 14.0, 27.0, 36.0, 58.0, 71.0, 109.0, 165.0, 246.0, 347.0, 516.0, 717.0, 1119.0, 1657.0, 2609.0, 3925.0, 6104.0, 9618.0, 15148.0, 24681.0, 41662.0, 73662.0, 147079.0, 1361971.0, 189366.0, 89605.0, 49602.0, 28669.0, 17219.0, 10838.0, 7004.0, 4461.0, 2947.0, 1915.0, 1246.0, 875.0, 585.0, 381.0, 270.0, 187.0, 135.0, 91.0, 48.0, 44.0, 27.0, 26.0, 12.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23046875, -0.22294998168945312, -0.21543121337890625, -0.20791244506835938, -0.2003936767578125, -0.19287490844726562, -0.18535614013671875, -0.17783737182617188, -0.170318603515625, -0.16279983520507812, -0.15528106689453125, -0.14776229858398438, -0.1402435302734375, -0.13272476196289062, -0.12520599365234375, -0.11768722534179688, -0.11016845703125, -0.10264968872070312, -0.09513092041015625, -0.08761215209960938, -0.0800933837890625, -0.07257461547851562, -0.06505584716796875, -0.057537078857421875, -0.050018310546875, -0.042499542236328125, -0.03498077392578125, -0.027462005615234375, -0.0199432373046875, -0.012424468994140625, -0.00490570068359375, 0.002613067626953125, 0.0101318359375, 0.017650604248046875, 0.02516937255859375, 0.032688140869140625, 0.0402069091796875, 0.047725677490234375, 0.05524444580078125, 0.06276321411132812, 0.070281982421875, 0.07780075073242188, 0.08531951904296875, 0.09283828735351562, 0.1003570556640625, 0.10787582397460938, 0.11539459228515625, 0.12291336059570312, 0.13043212890625, 0.13795089721679688, 0.14546966552734375, 0.15298843383789062, 0.1605072021484375, 0.16802597045898438, 0.17554473876953125, 0.18306350708007812, 0.190582275390625, 0.19810104370117188, 0.20561981201171875, 0.21313858032226562, 0.2206573486328125, 0.22817611694335938, 0.23569488525390625, 0.24321365356445312, 0.250732421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 17.0, 10.0, 13.0, 19.0, 21.0, 27.0, 24.0, 40.0, 35.0, 39.0, 32.0, 34.0, 42.0, 50.0, 43.0, 40.0, 50.0, 46.0, 50.0, 42.0, 42.0, 37.0, 26.0, 23.0, 29.0, 24.0, 18.0, 13.0, 13.0, 15.0, 13.0, 11.0, 7.0, 5.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.79304313659668e-05, -9.470432996749878e-05, -9.147822856903076e-05, -8.825212717056274e-05, -8.502602577209473e-05, -8.179992437362671e-05, -7.857382297515869e-05, -7.534772157669067e-05, -7.212162017822266e-05, -6.889551877975464e-05, -6.566941738128662e-05, -6.24433159828186e-05, -5.9217214584350586e-05, -5.599111318588257e-05, -5.276501178741455e-05, -4.953891038894653e-05, -4.6312808990478516e-05, -4.30867075920105e-05, -3.986060619354248e-05, -3.663450479507446e-05, -3.3408403396606445e-05, -3.0182301998138428e-05, -2.695620059967041e-05, -2.3730099201202393e-05, -2.0503997802734375e-05, -1.7277896404266357e-05, -1.405179500579834e-05, -1.0825693607330322e-05, -7.599592208862305e-06, -4.373490810394287e-06, -1.1473894119262695e-06, 2.078711986541748e-06, 5.304813385009766e-06, 8.530914783477783e-06, 1.17570161819458e-05, 1.4983117580413818e-05, 1.8209218978881836e-05, 2.1435320377349854e-05, 2.466142177581787e-05, 2.788752317428589e-05, 3.1113624572753906e-05, 3.4339725971221924e-05, 3.756582736968994e-05, 4.079192876815796e-05, 4.4018030166625977e-05, 4.7244131565093994e-05, 5.047023296356201e-05, 5.369633436203003e-05, 5.692243576049805e-05, 6.0148537158966064e-05, 6.337463855743408e-05, 6.66007399559021e-05, 6.982684135437012e-05, 7.305294275283813e-05, 7.627904415130615e-05, 7.950514554977417e-05, 8.273124694824219e-05, 8.59573483467102e-05, 8.918344974517822e-05, 9.240955114364624e-05, 9.563565254211426e-05, 9.886175394058228e-05, 0.00010208785533905029, 0.00010531395673751831, 0.00010854005813598633]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 10.0, 10.0, 14.0, 12.0, 20.0, 25.0, 26.0, 44.0, 58.0, 63.0, 74.0, 83.0, 118.0, 126.0, 157.0, 226.0, 332.0, 527.0, 1289.0, 217665.0, 823049.0, 2369.0, 642.0, 440.0, 254.0, 193.0, 135.0, 109.0, 89.0, 80.0, 63.0, 45.0, 38.0, 22.0, 27.0, 17.0, 22.0, 17.0, 12.0, 10.0, 14.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0021381378173828125, -0.002075508236885071, -0.002012878656387329, -0.0019502490758895874, -0.0018876194953918457, -0.001824989914894104, -0.0017623603343963623, -0.0016997307538986206, -0.001637101173400879, -0.0015744715929031372, -0.0015118420124053955, -0.0014492124319076538, -0.0013865828514099121, -0.0013239532709121704, -0.0012613236904144287, -0.001198694109916687, -0.0011360645294189453, -0.0010734349489212036, -0.001010805368423462, -0.0009481757879257202, -0.0008855462074279785, -0.0008229166269302368, -0.0007602870464324951, -0.0006976574659347534, -0.0006350278854370117, -0.00057239830493927, -0.0005097687244415283, -0.0004471391439437866, -0.0003845095634460449, -0.0003218799829483032, -0.0002592504024505615, -0.00019662082195281982, -0.00013399124145507812, -7.136166095733643e-05, -8.732080459594727e-06, 5.389750003814697e-05, 0.00011652708053588867, 0.00017915666103363037, 0.00024178624153137207, 0.00030441582202911377, 0.00036704540252685547, 0.00042967498302459717, 0.0004923045635223389, 0.0005549341440200806, 0.0006175637245178223, 0.000680193305015564, 0.0007428228855133057, 0.0008054524660110474, 0.0008680820465087891, 0.0009307116270065308, 0.0009933412075042725, 0.0010559707880020142, 0.0011186003684997559, 0.0011812299489974976, 0.0012438595294952393, 0.001306489109992981, 0.0013691186904907227, 0.0014317482709884644, 0.001494377851486206, 0.0015570074319839478, 0.0016196370124816895, 0.0016822665929794312, 0.0017448961734771729, 0.0018075257539749146, 0.0018701553344726562]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 24.0, 106.0, 240.0, 321.0, 211.0, 81.0, 25.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000263611989794299, -0.0002574029203969985, -0.0002511938218958676, -0.0002449847524985671, -0.0002387756685493514, -0.00023256658460013568, -0.00022635750065091997, -0.00022014841670170426, -0.00021393934730440378, -0.00020773026335518807, -0.00020152117940597236, -0.00019531211000867188, -0.00018910302605945617, -0.00018289394211024046, -0.00017668485816102475, -0.00017047577421180904, -0.00016426670481450856, -0.00015805762086529285, -0.00015184853691607714, -0.00014563946751877666, -0.00013943038356956095, -0.00013322129962034523, -0.00012701221567112952, -0.00012080313899787143, -0.0001145940477726981, -0.0001083849638234824, -0.0001021758871502243, -9.596680320100859e-05, -8.975772652775049e-05, -8.354864257853478e-05, -7.733955862931907e-05, -7.113048195606098e-05, -6.492140528280288e-05, -5.871232497156598e-05, -5.2503244660329074e-05, -4.6294160711113364e-05, -4.008508403785527e-05, -3.387600008863956e-05, -2.7666919777402654e-05, -2.145783946616575e-05, -1.5248759154928848e-05, -9.039678843691945e-06, -2.8305976229603402e-06, 3.3784835977712646e-06, 9.587563909008168e-06, 1.5796646039234474e-05, 2.2005726350471377e-05, 2.821480666170828e-05, 3.4423886972945184e-05, 4.0632967284182087e-05, 4.684204759541899e-05, 5.30511315446347e-05, 5.9260208217892796e-05, 6.54692921671085e-05, 7.16783688403666e-05, 7.788745278958231e-05, 8.409653673879802e-05, 9.030562068801373e-05, 9.651469736127183e-05, 0.00010272378131048754, 0.00010893285798374563, 0.00011514194193296134, 0.00012135102588217705, 0.00012756010983139277, 0.00013376917922869325]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 5.0, 7.0, 11.0, 16.0, 10.0, 15.0, 15.0, 18.0, 29.0, 30.0, 29.0, 26.0, 29.0, 36.0, 22.0, 56.0, 41.0, 40.0, 39.0, 47.0, 40.0, 49.0, 31.0, 29.0, 37.0, 29.0, 33.0, 35.0, 32.0, 24.0, 22.0, 18.0, 14.0, 21.0, 12.0, 9.0, 12.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.598234176635742e-05, -6.400793790817261e-05, -6.203353404998779e-05, -6.005913019180298e-05, -5.8084726333618164e-05, -5.611032247543335e-05, -5.4135918617248535e-05, -5.216151475906372e-05, -5.0187110900878906e-05, -4.821270704269409e-05, -4.623830318450928e-05, -4.426389932632446e-05, -4.228949546813965e-05, -4.0315091609954834e-05, -3.834068775177002e-05, -3.6366283893585205e-05, -3.439188003540039e-05, -3.2417476177215576e-05, -3.0443072319030762e-05, -2.8468668460845947e-05, -2.6494264602661133e-05, -2.451986074447632e-05, -2.2545456886291504e-05, -2.057105302810669e-05, -1.8596649169921875e-05, -1.662224531173706e-05, -1.4647841453552246e-05, -1.2673437595367432e-05, -1.0699033737182617e-05, -8.724629878997803e-06, -6.750226020812988e-06, -4.775822162628174e-06, -2.8014183044433594e-06, -8.270144462585449e-07, 1.1473894119262695e-06, 3.121793270111084e-06, 5.0961971282958984e-06, 7.070600986480713e-06, 9.045004844665527e-06, 1.1019408702850342e-05, 1.2993812561035156e-05, 1.496821641921997e-05, 1.6942620277404785e-05, 1.89170241355896e-05, 2.0891427993774414e-05, 2.286583185195923e-05, 2.4840235710144043e-05, 2.6814639568328857e-05, 2.8789043426513672e-05, 3.0763447284698486e-05, 3.27378511428833e-05, 3.4712255001068115e-05, 3.668665885925293e-05, 3.8661062717437744e-05, 4.063546657562256e-05, 4.260987043380737e-05, 4.458427429199219e-05, 4.6558678150177e-05, 4.8533082008361816e-05, 5.050748586654663e-05, 5.2481889724731445e-05, 5.445629358291626e-05, 5.6430697441101074e-05, 5.840510129928589e-05, 6.03795051574707e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 9.0, 8.0, 15.0, 19.0, 15.0, 26.0, 24.0, 29.0, 25.0, 26.0, 24.0, 31.0, 39.0, 38.0, 33.0, 36.0, 37.0, 43.0, 47.0, 37.0, 36.0, 32.0, 37.0, 38.0, 29.0, 24.0, 29.0, 26.0, 19.0, 25.0, 24.0, 26.0, 10.0, 11.0, 7.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.3779296875, -1.339202880859375, -1.30047607421875, -1.261749267578125, -1.2230224609375, -1.184295654296875, -1.14556884765625, -1.106842041015625, -1.068115234375, -1.029388427734375, -0.99066162109375, -0.951934814453125, -0.9132080078125, -0.874481201171875, -0.83575439453125, -0.797027587890625, -0.75830078125, -0.719573974609375, -0.68084716796875, -0.642120361328125, -0.6033935546875, -0.564666748046875, -0.52593994140625, -0.487213134765625, -0.448486328125, -0.409759521484375, -0.37103271484375, -0.332305908203125, -0.2935791015625, -0.254852294921875, -0.21612548828125, -0.177398681640625, -0.138671875, -0.099945068359375, -0.06121826171875, -0.022491455078125, 0.0162353515625, 0.054962158203125, 0.09368896484375, 0.132415771484375, 0.171142578125, 0.209869384765625, 0.24859619140625, 0.287322998046875, 0.3260498046875, 0.364776611328125, 0.40350341796875, 0.442230224609375, 0.48095703125, 0.519683837890625, 0.55841064453125, 0.597137451171875, 0.6358642578125, 0.674591064453125, 0.71331787109375, 0.752044677734375, 0.790771484375, 0.829498291015625, 0.86822509765625, 0.906951904296875, 0.9456787109375, 0.984405517578125, 1.02313232421875, 1.061859130859375, 1.1005859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 11.0, 9.0, 17.0, 16.0, 23.0, 40.0, 61.0, 67.0, 112.0, 136.0, 203.0, 297.0, 405.0, 708.0, 1196.0, 2100.0, 4135.0, 8320.0, 18818.0, 45157.0, 109850.0, 233362.0, 300918.0, 182887.0, 79674.0, 32335.0, 13680.0, 6383.0, 3213.0, 1673.0, 961.0, 559.0, 374.0, 227.0, 198.0, 107.0, 88.0, 65.0, 41.0, 49.0, 24.0, 16.0, 15.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.763671875, -1.7137298583984375, -1.663787841796875, -1.6138458251953125, -1.56390380859375, -1.5139617919921875, -1.464019775390625, -1.4140777587890625, -1.3641357421875, -1.3141937255859375, -1.264251708984375, -1.2143096923828125, -1.16436767578125, -1.1144256591796875, -1.064483642578125, -1.0145416259765625, -0.964599609375, -0.9146575927734375, -0.864715576171875, -0.8147735595703125, -0.76483154296875, -0.7148895263671875, -0.664947509765625, -0.6150054931640625, -0.5650634765625, -0.5151214599609375, -0.465179443359375, -0.4152374267578125, -0.36529541015625, -0.3153533935546875, -0.265411376953125, -0.2154693603515625, -0.16552734375, -0.1155853271484375, -0.065643310546875, -0.0157012939453125, 0.03424072265625, 0.0841827392578125, 0.134124755859375, 0.1840667724609375, 0.2340087890625, 0.2839508056640625, 0.333892822265625, 0.3838348388671875, 0.43377685546875, 0.4837188720703125, 0.533660888671875, 0.5836029052734375, 0.633544921875, 0.6834869384765625, 0.733428955078125, 0.7833709716796875, 0.83331298828125, 0.8832550048828125, 0.933197021484375, 0.9831390380859375, 1.0330810546875, 1.0830230712890625, 1.132965087890625, 1.1829071044921875, 1.23284912109375, 1.2827911376953125, 1.332733154296875, 1.3826751708984375, 1.4326171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 3.0, 5.0, 12.0, 15.0, 11.0, 13.0, 20.0, 25.0, 23.0, 35.0, 30.0, 38.0, 46.0, 46.0, 59.0, 86.0, 154.0, 315.0, 1390.0, 197.0, 99.0, 67.0, 51.0, 40.0, 38.0, 37.0, 24.0, 23.0, 18.0, 26.0, 18.0, 10.0, 16.0, 8.0, 7.0, 10.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.67431640625, -4.5244140625, -4.37451171875, -4.224609375, -4.07470703125, -3.9248046875, -3.77490234375, -3.625, -3.47509765625, -3.3251953125, -3.17529296875, -3.025390625, -2.87548828125, -2.7255859375, -2.57568359375, -2.42578125, -2.27587890625, -2.1259765625, -1.97607421875, -1.826171875, -1.67626953125, -1.5263671875, -1.37646484375, -1.2265625, -1.07666015625, -0.9267578125, -0.77685546875, -0.626953125, -0.47705078125, -0.3271484375, -0.17724609375, -0.02734375, 0.12255859375, 0.2724609375, 0.42236328125, 0.572265625, 0.72216796875, 0.8720703125, 1.02197265625, 1.171875, 1.32177734375, 1.4716796875, 1.62158203125, 1.771484375, 1.92138671875, 2.0712890625, 2.22119140625, 2.37109375, 2.52099609375, 2.6708984375, 2.82080078125, 2.970703125, 3.12060546875, 3.2705078125, 3.42041015625, 3.5703125, 3.72021484375, 3.8701171875, 4.02001953125, 4.169921875, 4.31982421875, 4.4697265625, 4.61962890625, 4.76953125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 11.0, 7.0, 15.0, 12.0, 10.0, 16.0, 18.0, 23.0, 25.0, 37.0, 51.0, 73.0, 103.0, 155.0, 290.0, 572.0, 1856.0, 24930.0, 2746057.0, 363908.0, 5446.0, 961.0, 404.0, 228.0, 131.0, 90.0, 62.0, 45.0, 23.0, 29.0, 22.0, 17.0, 18.0, 12.0, 15.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.65625, -9.352294921875, -9.04833984375, -8.744384765625, -8.4404296875, -8.136474609375, -7.83251953125, -7.528564453125, -7.224609375, -6.920654296875, -6.61669921875, -6.312744140625, -6.0087890625, -5.704833984375, -5.40087890625, -5.096923828125, -4.79296875, -4.489013671875, -4.18505859375, -3.881103515625, -3.5771484375, -3.273193359375, -2.96923828125, -2.665283203125, -2.361328125, -2.057373046875, -1.75341796875, -1.449462890625, -1.1455078125, -0.841552734375, -0.53759765625, -0.233642578125, 0.0703125, 0.374267578125, 0.67822265625, 0.982177734375, 1.2861328125, 1.590087890625, 1.89404296875, 2.197998046875, 2.501953125, 2.805908203125, 3.10986328125, 3.413818359375, 3.7177734375, 4.021728515625, 4.32568359375, 4.629638671875, 4.93359375, 5.237548828125, 5.54150390625, 5.845458984375, 6.1494140625, 6.453369140625, 6.75732421875, 7.061279296875, 7.365234375, 7.669189453125, 7.97314453125, 8.277099609375, 8.5810546875, 8.885009765625, 9.18896484375, 9.492919921875, 9.796875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 30.0, 100.0, 245.0, 326.0, 214.0, 72.0, 15.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.365718841552734, -26.832176208496094, -26.298633575439453, -25.765090942382812, -25.231548309326172, -24.698007583618164, -24.164464950561523, -23.630922317504883, -23.097379684448242, -22.5638370513916, -22.03029441833496, -21.49675178527832, -20.963211059570312, -20.429668426513672, -19.89612579345703, -19.36258316040039, -18.82904052734375, -18.29549789428711, -17.76195526123047, -17.228412628173828, -16.694869995117188, -16.16132926940918, -15.627786636352539, -15.094244003295898, -14.560701370239258, -14.027158737182617, -13.493616104125977, -12.960074424743652, -12.426531791687012, -11.892989158630371, -11.359447479248047, -10.825904846191406, -10.292362213134766, -9.758819580078125, -9.225276947021484, -8.69173526763916, -8.15819263458252, -7.624650001525879, -7.0911078453063965, -6.557565689086914, -6.024022579193115, -5.490480422973633, -4.956937789916992, -4.423395156860352, -3.889853000640869, -3.3563106060028076, -2.822768211364746, -2.2892258167266846, -1.755683422088623, -1.2221410274505615, -0.6885986328125, -0.15505623817443848, 0.37848615646362305, 0.9120285511016846, 1.445570945739746, 1.9791133403778076, 2.512655735015869, 3.0461981296539307, 3.579740524291992, 4.113283157348633, 4.646825313568115, 5.180367469787598, 5.713910102844238, 6.247452735900879, 6.780994892120361]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 5.0, 7.0, 8.0, 7.0, 15.0, 12.0, 12.0, 10.0, 21.0, 19.0, 18.0, 27.0, 31.0, 35.0, 40.0, 25.0, 37.0, 46.0, 39.0, 28.0, 42.0, 32.0, 32.0, 31.0, 31.0, 37.0, 36.0, 29.0, 34.0, 33.0, 32.0, 29.0, 13.0, 29.0, 19.0, 9.0, 11.0, 14.0, 9.0, 12.0, 8.0, 10.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.07627010345459, -12.650373458862305, -12.224477767944336, -11.79858112335205, -11.372684478759766, -10.946788787841797, -10.520892143249512, -10.094995498657227, -9.669099807739258, -9.243203163146973, -8.817307472229004, -8.391410827636719, -7.965514659881592, -7.539618492126465, -7.11372184753418, -6.687825679779053, -6.261929035186768, -5.836032867431641, -5.4101362228393555, -4.9842400550842285, -4.558343887329102, -4.132447242736816, -3.7065510749816895, -3.2806549072265625, -2.8547585010528564, -2.4288620948791504, -2.0029659271240234, -1.5770695209503174, -1.1511732339859009, -0.7252769470214844, -0.2993805408477783, 0.12651562690734863, 0.5524120330810547, 0.9783083200454712, 1.4042046070098877, 1.8301010131835938, 2.2559971809387207, 2.6818935871124268, 3.107789993286133, 3.5336861610412598, 3.959582567214966, 4.385478973388672, 4.811375141143799, 5.237271308898926, 5.663167953491211, 6.089064121246338, 6.514960289001465, 6.94085693359375, 7.366753101348877, 7.792649269104004, 8.218545913696289, 8.644441604614258, 9.070338249206543, 9.496234893798828, 9.922130584716797, 10.348027229309082, 10.773923873901367, 11.199820518493652, 11.625716209411621, 12.051612854003906, 12.477509498596191, 12.90340518951416, 13.329301834106445, 13.755197525024414, 14.1810941696167]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 10.0, 3.0, 12.0, 15.0, 15.0, 20.0, 26.0, 22.0, 23.0, 28.0, 25.0, 36.0, 27.0, 37.0, 36.0, 47.0, 35.0, 47.0, 42.0, 47.0, 37.0, 33.0, 30.0, 36.0, 33.0, 37.0, 29.0, 28.0, 28.0, 21.0, 14.0, 18.0, 19.0, 15.0, 12.0, 11.0, 9.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.5, -1.4578704833984375, -1.415740966796875, -1.3736114501953125, -1.33148193359375, -1.2893524169921875, -1.247222900390625, -1.2050933837890625, -1.1629638671875, -1.1208343505859375, -1.078704833984375, -1.0365753173828125, -0.99444580078125, -0.9523162841796875, -0.910186767578125, -0.8680572509765625, -0.825927734375, -0.7837982177734375, -0.741668701171875, -0.6995391845703125, -0.65740966796875, -0.6152801513671875, -0.573150634765625, -0.5310211181640625, -0.4888916015625, -0.4467620849609375, -0.404632568359375, -0.3625030517578125, -0.32037353515625, -0.2782440185546875, -0.236114501953125, -0.1939849853515625, -0.15185546875, -0.1097259521484375, -0.067596435546875, -0.0254669189453125, 0.01666259765625, 0.0587921142578125, 0.100921630859375, 0.1430511474609375, 0.1851806640625, 0.2273101806640625, 0.269439697265625, 0.3115692138671875, 0.35369873046875, 0.3958282470703125, 0.437957763671875, 0.4800872802734375, 0.522216796875, 0.5643463134765625, 0.606475830078125, 0.6486053466796875, 0.69073486328125, 0.7328643798828125, 0.774993896484375, 0.8171234130859375, 0.8592529296875, 0.9013824462890625, 0.943511962890625, 0.9856414794921875, 1.02777099609375, 1.0699005126953125, 1.112030029296875, 1.1541595458984375, 1.1962890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 6.0, 13.0, 14.0, 14.0, 20.0, 19.0, 38.0, 52.0, 56.0, 78.0, 106.0, 180.0, 341.0, 752.0, 2231.0, 9942.0, 75733.0, 1169697.0, 2659620.0, 245612.0, 23152.0, 4187.0, 1185.0, 468.0, 200.0, 161.0, 100.0, 55.0, 57.0, 50.0, 23.0, 16.0, 17.0, 14.0, 11.0, 21.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.65234375, -4.50335693359375, -4.3543701171875, -4.20538330078125, -4.056396484375, -3.90740966796875, -3.7584228515625, -3.60943603515625, -3.46044921875, -3.31146240234375, -3.1624755859375, -3.01348876953125, -2.864501953125, -2.71551513671875, -2.5665283203125, -2.41754150390625, -2.2685546875, -2.11956787109375, -1.9705810546875, -1.82159423828125, -1.672607421875, -1.52362060546875, -1.3746337890625, -1.22564697265625, -1.07666015625, -0.92767333984375, -0.7786865234375, -0.62969970703125, -0.480712890625, -0.33172607421875, -0.1827392578125, -0.03375244140625, 0.115234375, 0.26422119140625, 0.4132080078125, 0.56219482421875, 0.711181640625, 0.86016845703125, 1.0091552734375, 1.15814208984375, 1.30712890625, 1.45611572265625, 1.6051025390625, 1.75408935546875, 1.903076171875, 2.05206298828125, 2.2010498046875, 2.35003662109375, 2.4990234375, 2.64801025390625, 2.7969970703125, 2.94598388671875, 3.094970703125, 3.24395751953125, 3.3929443359375, 3.54193115234375, 3.69091796875, 3.83990478515625, 3.9888916015625, 4.13787841796875, 4.286865234375, 4.43585205078125, 4.5848388671875, 4.73382568359375, 4.8828125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 14.0, 19.0, 25.0, 43.0, 65.0, 111.0, 189.0, 287.0, 429.0, 561.0, 639.0, 530.0, 420.0, 256.0, 172.0, 113.0, 75.0, 62.0, 22.0, 10.0, 8.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.667510986328125, -8.46783447265625, -8.268157958984375, -8.0684814453125, -7.868804931640625, -7.66912841796875, -7.469451904296875, -7.269775390625, -7.070098876953125, -6.87042236328125, -6.670745849609375, -6.4710693359375, -6.271392822265625, -6.07171630859375, -5.872039794921875, -5.67236328125, -5.472686767578125, -5.27301025390625, -5.073333740234375, -4.8736572265625, -4.673980712890625, -4.47430419921875, -4.274627685546875, -4.074951171875, -3.875274658203125, -3.67559814453125, -3.475921630859375, -3.2762451171875, -3.076568603515625, -2.87689208984375, -2.677215576171875, -2.4775390625, -2.277862548828125, -2.07818603515625, -1.878509521484375, -1.6788330078125, -1.479156494140625, -1.27947998046875, -1.079803466796875, -0.880126953125, -0.680450439453125, -0.48077392578125, -0.281097412109375, -0.0814208984375, 0.118255615234375, 0.31793212890625, 0.517608642578125, 0.71728515625, 0.916961669921875, 1.11663818359375, 1.316314697265625, 1.5159912109375, 1.715667724609375, 1.91534423828125, 2.115020751953125, 2.314697265625, 2.514373779296875, 2.71405029296875, 2.913726806640625, 3.1134033203125, 3.313079833984375, 3.51275634765625, 3.712432861328125, 3.912109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 9.0, 16.0, 17.0, 51.0, 77.0, 138.0, 201.0, 445.0, 969.0, 5580.0, 250136.0, 3817389.0, 113831.0, 3874.0, 828.0, 314.0, 150.0, 106.0, 49.0, 30.0, 17.0, 21.0, 7.0, 7.0, 4.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.24267578125, -10.7822265625, -10.32177734375, -9.861328125, -9.40087890625, -8.9404296875, -8.47998046875, -8.01953125, -7.55908203125, -7.0986328125, -6.63818359375, -6.177734375, -5.71728515625, -5.2568359375, -4.79638671875, -4.3359375, -3.87548828125, -3.4150390625, -2.95458984375, -2.494140625, -2.03369140625, -1.5732421875, -1.11279296875, -0.65234375, -0.19189453125, 0.2685546875, 0.72900390625, 1.189453125, 1.64990234375, 2.1103515625, 2.57080078125, 3.03125, 3.49169921875, 3.9521484375, 4.41259765625, 4.873046875, 5.33349609375, 5.7939453125, 6.25439453125, 6.71484375, 7.17529296875, 7.6357421875, 8.09619140625, 8.556640625, 9.01708984375, 9.4775390625, 9.93798828125, 10.3984375, 10.85888671875, 11.3193359375, 11.77978515625, 12.240234375, 12.70068359375, 13.1611328125, 13.62158203125, 14.08203125, 14.54248046875, 15.0029296875, 15.46337890625, 15.923828125, 16.38427734375, 16.8447265625, 17.30517578125, 17.765625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 26.0, 42.0, 95.0, 138.0, 178.0, 174.0, 158.0, 92.0, 61.0, 29.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.693729400634766, -36.87528610229492, -36.05684280395508, -35.238399505615234, -34.41995620727539, -33.60151290893555, -32.7830696105957, -31.964624404907227, -31.146181106567383, -30.32773780822754, -29.509294509887695, -28.69085121154785, -27.872407913208008, -27.05396270751953, -26.235519409179688, -25.417076110839844, -24.5986328125, -23.780189514160156, -22.961746215820312, -22.14330291748047, -21.324859619140625, -20.50641632080078, -19.687973022460938, -18.86952781677246, -18.05108642578125, -17.232643127441406, -16.414199829101562, -15.595756530761719, -14.777312278747559, -13.958868980407715, -13.140425682067871, -12.321981430053711, -11.50353717803955, -10.685093879699707, -9.866650581359863, -9.048206329345703, -8.22976303100586, -7.411319732666016, -6.592876434326172, -5.77443265914917, -4.955989360809326, -4.137546062469482, -3.3191022872924805, -2.5006589889526367, -1.6822154521942139, -0.863771915435791, -0.045328617095947266, 0.7731151580810547, 1.5915584564208984, 2.4100019931793213, 3.228445529937744, 4.046888828277588, 4.86533260345459, 5.683775901794434, 6.502219200134277, 7.320662975311279, 8.139106750488281, 8.957550048828125, 9.775993347167969, 10.594436645507812, 11.412880897521973, 12.231324195861816, 13.04976749420166, 13.86821174621582, 14.686654090881348]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 6.0, 8.0, 8.0, 9.0, 6.0, 11.0, 16.0, 20.0, 20.0, 13.0, 22.0, 22.0, 34.0, 40.0, 39.0, 29.0, 48.0, 29.0, 40.0, 41.0, 42.0, 52.0, 45.0, 50.0, 37.0, 38.0, 34.0, 35.0, 39.0, 22.0, 24.0, 21.0, 18.0, 14.0, 13.0, 8.0, 15.0, 11.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.780960083007812, -12.321908950805664, -11.8628568649292, -11.40380573272705, -10.944753646850586, -10.485702514648438, -10.026651382446289, -9.567599296569824, -9.10854721069336, -8.649496078491211, -8.190443992614746, -7.731392860412598, -7.272340774536133, -6.813289642333984, -6.354238033294678, -5.895186424255371, -5.436135292053223, -4.977083683013916, -4.518032073974609, -4.058980941772461, -3.599929094314575, -3.1408774852752686, -2.681826114654541, -2.2227745056152344, -1.7637228965759277, -1.304671287536621, -0.845619797706604, -0.3865683078765869, 0.07248330116271973, 0.5315349102020264, 0.9905862808227539, 1.4496378898620605, 1.9086894989013672, 2.367741107940674, 2.8267927169799805, 3.285844087600708, 3.7448956966400146, 4.203947067260742, 4.662998676300049, 5.1220502853393555, 5.581101894378662, 6.040153503417969, 6.499205112457275, 6.958256721496582, 7.4173078536987305, 7.876359939575195, 8.335411071777344, 8.794462203979492, 9.253514289855957, 9.712565422058105, 10.17161750793457, 10.630668640136719, 11.089720726013184, 11.548771858215332, 12.007823944091797, 12.466875076293945, 12.925926208496094, 13.384977340698242, 13.844029426574707, 14.303080558776855, 14.76213264465332, 15.221183776855469, 15.680234909057617, 16.139286041259766, 16.598339080810547]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 1.0, 10.0, 6.0, 13.0, 9.0, 16.0, 12.0, 13.0, 15.0, 31.0, 25.0, 21.0, 26.0, 37.0, 35.0, 37.0, 43.0, 46.0, 28.0, 52.0, 45.0, 41.0, 48.0, 39.0, 37.0, 44.0, 33.0, 30.0, 35.0, 27.0, 20.0, 22.0, 19.0, 16.0, 14.0, 8.0, 7.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5255889892578125, -1.479888916015625, -1.4341888427734375, -1.38848876953125, -1.3427886962890625, -1.297088623046875, -1.2513885498046875, -1.2056884765625, -1.1599884033203125, -1.114288330078125, -1.0685882568359375, -1.02288818359375, -0.9771881103515625, -0.931488037109375, -0.8857879638671875, -0.840087890625, -0.7943878173828125, -0.748687744140625, -0.7029876708984375, -0.65728759765625, -0.6115875244140625, -0.565887451171875, -0.5201873779296875, -0.4744873046875, -0.4287872314453125, -0.383087158203125, -0.3373870849609375, -0.29168701171875, -0.2459869384765625, -0.200286865234375, -0.1545867919921875, -0.10888671875, -0.0631866455078125, -0.017486572265625, 0.0282135009765625, 0.07391357421875, 0.1196136474609375, 0.165313720703125, 0.2110137939453125, 0.2567138671875, 0.3024139404296875, 0.348114013671875, 0.3938140869140625, 0.43951416015625, 0.4852142333984375, 0.530914306640625, 0.5766143798828125, 0.622314453125, 0.6680145263671875, 0.713714599609375, 0.7594146728515625, 0.80511474609375, 0.8508148193359375, 0.896514892578125, 0.9422149658203125, 0.9879150390625, 1.0336151123046875, 1.079315185546875, 1.1250152587890625, 1.17071533203125, 1.2164154052734375, 1.262115478515625, 1.3078155517578125, 1.353515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 7.0, 19.0, 17.0, 28.0, 43.0, 69.0, 92.0, 163.0, 239.0, 372.0, 528.0, 827.0, 1158.0, 1796.0, 2686.0, 4127.0, 6341.0, 9832.0, 15289.0, 24334.0, 39818.0, 68350.0, 134376.0, 311537.0, 200655.0, 91117.0, 50681.0, 30392.0, 18971.0, 12096.0, 7802.0, 4993.0, 3337.0, 2127.0, 1415.0, 980.0, 673.0, 461.0, 263.0, 184.0, 137.0, 78.0, 54.0, 36.0, 20.0, 15.0, 5.0, 8.0, 3.0, 2.0, 6.0, 1.0, 2.0], "bins": [-0.301025390625, -0.2923583984375, -0.28369140625, -0.2750244140625, -0.266357421875, -0.2576904296875, -0.2490234375, -0.2403564453125, -0.231689453125, -0.2230224609375, -0.21435546875, -0.2056884765625, -0.197021484375, -0.1883544921875, -0.1796875, -0.1710205078125, -0.162353515625, -0.1536865234375, -0.14501953125, -0.1363525390625, -0.127685546875, -0.1190185546875, -0.1103515625, -0.1016845703125, -0.093017578125, -0.0843505859375, -0.07568359375, -0.0670166015625, -0.058349609375, -0.0496826171875, -0.041015625, -0.0323486328125, -0.023681640625, -0.0150146484375, -0.00634765625, 0.0023193359375, 0.010986328125, 0.0196533203125, 0.0283203125, 0.0369873046875, 0.045654296875, 0.0543212890625, 0.06298828125, 0.0716552734375, 0.080322265625, 0.0889892578125, 0.09765625, 0.1063232421875, 0.114990234375, 0.1236572265625, 0.13232421875, 0.1409912109375, 0.149658203125, 0.1583251953125, 0.1669921875, 0.1756591796875, 0.184326171875, 0.1929931640625, 0.20166015625, 0.2103271484375, 0.218994140625, 0.2276611328125, 0.236328125, 0.2449951171875, 0.253662109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 13.0, 7.0, 9.0, 12.0, 14.0, 17.0, 14.0, 27.0, 27.0, 18.0, 29.0, 31.0, 33.0, 42.0, 29.0, 45.0, 35.0, 47.0, 1056.0, 47.0, 43.0, 45.0, 29.0, 43.0, 31.0, 47.0, 23.0, 30.0, 35.0, 24.0, 33.0, 17.0, 8.0, 16.0, 15.0, 3.0, 14.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.88671875, -0.8589859008789062, -0.8312530517578125, -0.8035202026367188, -0.775787353515625, -0.7480545043945312, -0.7203216552734375, -0.6925888061523438, -0.66485595703125, -0.6371231079101562, -0.6093902587890625, -0.5816574096679688, -0.553924560546875, -0.5261917114257812, -0.4984588623046875, -0.47072601318359375, -0.4429931640625, -0.41526031494140625, -0.3875274658203125, -0.35979461669921875, -0.332061767578125, -0.30432891845703125, -0.2765960693359375, -0.24886322021484375, -0.22113037109375, -0.19339752197265625, -0.1656646728515625, -0.13793182373046875, -0.110198974609375, -0.08246612548828125, -0.0547332763671875, -0.02700042724609375, 0.000732421875, 0.02846527099609375, 0.0561981201171875, 0.08393096923828125, 0.111663818359375, 0.13939666748046875, 0.1671295166015625, 0.19486236572265625, 0.22259521484375, 0.25032806396484375, 0.2780609130859375, 0.30579376220703125, 0.333526611328125, 0.36125946044921875, 0.3889923095703125, 0.41672515869140625, 0.4444580078125, 0.47219085693359375, 0.4999237060546875, 0.5276565551757812, 0.555389404296875, 0.5831222534179688, 0.6108551025390625, 0.6385879516601562, 0.66632080078125, 0.6940536499023438, 0.7217864990234375, 0.7495193481445312, 0.777252197265625, 0.8049850463867188, 0.8327178955078125, 0.8604507446289062, 0.88818359375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 14.0, 21.0, 25.0, 38.0, 62.0, 78.0, 121.0, 186.0, 257.0, 402.0, 610.0, 901.0, 1438.0, 2098.0, 3247.0, 5145.0, 7987.0, 12615.0, 19977.0, 33368.0, 55336.0, 99462.0, 209679.0, 1333621.0, 132897.0, 69595.0, 40969.0, 24646.0, 15078.0, 9653.0, 6208.0, 3974.0, 2524.0, 1687.0, 1079.0, 693.0, 445.0, 313.0, 206.0, 144.0, 100.0, 65.0, 48.0, 40.0, 29.0, 18.0, 9.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2445068359375, -0.23691558837890625, -0.2293243408203125, -0.22173309326171875, -0.214141845703125, -0.20655059814453125, -0.1989593505859375, -0.19136810302734375, -0.18377685546875, -0.17618560791015625, -0.1685943603515625, -0.16100311279296875, -0.153411865234375, -0.14582061767578125, -0.1382293701171875, -0.13063812255859375, -0.123046875, -0.11545562744140625, -0.1078643798828125, -0.10027313232421875, -0.092681884765625, -0.08509063720703125, -0.0774993896484375, -0.06990814208984375, -0.06231689453125, -0.05472564697265625, -0.0471343994140625, -0.03954315185546875, -0.031951904296875, -0.02436065673828125, -0.0167694091796875, -0.00917816162109375, -0.0015869140625, 0.00600433349609375, 0.0135955810546875, 0.02118682861328125, 0.028778076171875, 0.03636932373046875, 0.0439605712890625, 0.05155181884765625, 0.05914306640625, 0.06673431396484375, 0.0743255615234375, 0.08191680908203125, 0.089508056640625, 0.09709930419921875, 0.1046905517578125, 0.11228179931640625, 0.119873046875, 0.12746429443359375, 0.1350555419921875, 0.14264678955078125, 0.150238037109375, 0.15782928466796875, 0.1654205322265625, 0.17301177978515625, 0.18060302734375, 0.18819427490234375, 0.1957855224609375, 0.20337677001953125, 0.210968017578125, 0.21855926513671875, 0.2261505126953125, 0.23374176025390625, 0.2413330078125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 6.0, 6.0, 4.0, 5.0, 8.0, 12.0, 11.0, 8.0, 21.0, 25.0, 19.0, 30.0, 26.0, 40.0, 43.0, 47.0, 46.0, 44.0, 46.0, 55.0, 55.0, 51.0, 55.0, 40.0, 43.0, 38.0, 40.0, 31.0, 22.0, 18.0, 20.0, 15.0, 19.0, 12.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0001678466796875, -0.00016313977539539337, -0.00015843287110328674, -0.00015372596681118011, -0.00014901906251907349, -0.00014431215822696686, -0.00013960525393486023, -0.0001348983496427536, -0.00013019144535064697, -0.00012548454105854034, -0.00012077763676643372, -0.00011607073247432709, -0.00011136382818222046, -0.00010665692389011383, -0.0001019500195980072, -9.724311530590057e-05, -9.253621101379395e-05, -8.782930672168732e-05, -8.312240242958069e-05, -7.841549813747406e-05, -7.370859384536743e-05, -6.90016895532608e-05, -6.429478526115417e-05, -5.9587880969047546e-05, -5.488097667694092e-05, -5.017407238483429e-05, -4.546716809272766e-05, -4.076026380062103e-05, -3.6053359508514404e-05, -3.1346455216407776e-05, -2.6639550924301147e-05, -2.193264663219452e-05, -1.722574234008789e-05, -1.2518838047981262e-05, -7.811933755874634e-06, -3.1050294637680054e-06, 1.601874828338623e-06, 6.3087791204452515e-06, 1.101568341255188e-05, 1.5722587704658508e-05, 2.0429491996765137e-05, 2.5136396288871765e-05, 2.9843300580978394e-05, 3.455020487308502e-05, 3.925710916519165e-05, 4.396401345729828e-05, 4.867091774940491e-05, 5.3377822041511536e-05, 5.8084726333618164e-05, 6.279163062572479e-05, 6.749853491783142e-05, 7.220543920993805e-05, 7.691234350204468e-05, 8.16192477941513e-05, 8.632615208625793e-05, 9.103305637836456e-05, 9.573996067047119e-05, 0.00010044686496257782, 0.00010515376925468445, 0.00010986067354679108, 0.0001145675778388977, 0.00011927448213100433, 0.00012398138642311096, 0.0001286882907152176, 0.00013339519500732422]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 12.0, 10.0, 17.0, 12.0, 20.0, 35.0, 27.0, 54.0, 64.0, 79.0, 101.0, 124.0, 161.0, 206.0, 323.0, 548.0, 2892.0, 980844.0, 60567.0, 947.0, 408.0, 295.0, 195.0, 153.0, 93.0, 95.0, 54.0, 53.0, 34.0, 25.0, 40.0, 13.0, 18.0, 6.0, 5.0, 4.0, 2.0, 0.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025768280029296875, -0.0024839043617248535, -0.0023909807205200195, -0.0022980570793151855, -0.0022051334381103516, -0.0021122097969055176, -0.0020192861557006836, -0.0019263625144958496, -0.0018334388732910156, -0.0017405152320861816, -0.0016475915908813477, -0.0015546679496765137, -0.0014617443084716797, -0.0013688206672668457, -0.0012758970260620117, -0.0011829733848571777, -0.0010900497436523438, -0.0009971261024475098, -0.0009042024612426758, -0.0008112788200378418, -0.0007183551788330078, -0.0006254315376281738, -0.0005325078964233398, -0.00043958425521850586, -0.0003466606140136719, -0.0002537369728088379, -0.0001608133316040039, -6.788969039916992e-05, 2.5033950805664062e-05, 0.00011795759201049805, 0.00021088123321533203, 0.000303804874420166, 0.000396728515625, 0.000489652156829834, 0.000582575798034668, 0.000675499439239502, 0.0007684230804443359, 0.0008613467216491699, 0.0009542703628540039, 0.0010471940040588379, 0.0011401176452636719, 0.0012330412864685059, 0.0013259649276733398, 0.0014188885688781738, 0.0015118122100830078, 0.0016047358512878418, 0.0016976594924926758, 0.0017905831336975098, 0.0018835067749023438, 0.0019764304161071777, 0.0020693540573120117, 0.0021622776985168457, 0.0022552013397216797, 0.0023481249809265137, 0.0024410486221313477, 0.0025339722633361816, 0.0026268959045410156, 0.0027198195457458496, 0.0028127431869506836, 0.0029056668281555176, 0.0029985904693603516, 0.0030915141105651855, 0.0031844377517700195, 0.0032773613929748535, 0.0033702850341796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 45.0, 175.0, 337.0, 286.0, 121.0, 39.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024024049344006926, -0.00023130580666474998, -0.00022237110533751547, -0.0002134364185621962, -0.00020450173178687692, -0.0001955670304596424, -0.00018663234368432313, -0.00017769765690900385, -0.00016876295558176935, -0.00015982826880645007, -0.00015089356747921556, -0.00014195888070389628, -0.000133024193928577, -0.00012408950715325773, -0.00011515480582602322, -0.00010622011905070394, -9.728543227538466e-05, -8.835073822410777e-05, -7.94160514487885e-05, -7.04813573975116e-05, -6.154667062219232e-05, -5.261197657091543e-05, -4.367728251963854e-05, -3.474259574431926e-05, -2.5807901693042368e-05, -1.6873211279744282e-05, -7.938519047456793e-06, 9.961731848306954e-07, 9.93086359812878e-06, 1.8865554011426866e-05, 2.780024806270376e-05, 3.673493483802304e-05, 4.566964344121516e-05, 5.460433385451324e-05, 6.353902426781133e-05, 7.247371831908822e-05, 8.14084050944075e-05, 9.034309914568439e-05, 9.927779319696128e-05, 0.00010821247997228056, 0.00011714717402355745, 0.00012608186807483435, 0.00013501655485015363, 0.0001439512416254729, 0.0001528859429527074, 0.0001618206297280267, 0.00017075531650334597, 0.00017969001783058047, 0.00018862470460589975, 0.00019755939138121903, 0.00020649409270845354, 0.00021542877948377281, 0.0002243634662590921, 0.0002332981675863266, 0.00024223285436164588, 0.00025116754113696516, 0.00026010224246419966, 0.00026903694379143417, 0.0002779716160148382, 0.0002869063173420727, 0.00029584101866930723, 0.0003047756908927113, 0.0003137103922199458, 0.00032264506444334984, 0.00033157976577058434]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 7.0, 8.0, 11.0, 13.0, 26.0, 17.0, 25.0, 26.0, 22.0, 25.0, 28.0, 35.0, 35.0, 33.0, 24.0, 48.0, 43.0, 42.0, 41.0, 54.0, 30.0, 45.0, 41.0, 28.0, 30.0, 32.0, 16.0, 39.0, 21.0, 29.0, 21.0, 18.0, 16.0, 15.0, 10.0, 13.0, 5.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.417533874511719e-05, -9.147822856903076e-05, -8.878111839294434e-05, -8.608400821685791e-05, -8.338689804077148e-05, -8.068978786468506e-05, -7.799267768859863e-05, -7.529556751251221e-05, -7.259845733642578e-05, -6.990134716033936e-05, -6.720423698425293e-05, -6.45071268081665e-05, -6.181001663208008e-05, -5.911290645599365e-05, -5.6415796279907227e-05, -5.37186861038208e-05, -5.1021575927734375e-05, -4.832446575164795e-05, -4.5627355575561523e-05, -4.29302453994751e-05, -4.023313522338867e-05, -3.7536025047302246e-05, -3.483891487121582e-05, -3.2141804695129395e-05, -2.944469451904297e-05, -2.6747584342956543e-05, -2.4050474166870117e-05, -2.135336399078369e-05, -1.8656253814697266e-05, -1.595914363861084e-05, -1.3262033462524414e-05, -1.0564923286437988e-05, -7.867813110351562e-06, -5.170702934265137e-06, -2.473592758178711e-06, 2.2351741790771484e-07, 2.9206275939941406e-06, 5.617737770080566e-06, 8.314847946166992e-06, 1.1011958122253418e-05, 1.3709068298339844e-05, 1.640617847442627e-05, 1.9103288650512695e-05, 2.180039882659912e-05, 2.4497509002685547e-05, 2.7194619178771973e-05, 2.98917293548584e-05, 3.2588839530944824e-05, 3.528594970703125e-05, 3.7983059883117676e-05, 4.06801700592041e-05, 4.337728023529053e-05, 4.607439041137695e-05, 4.877150058746338e-05, 5.1468610763549805e-05, 5.416572093963623e-05, 5.6862831115722656e-05, 5.955994129180908e-05, 6.225705146789551e-05, 6.495416164398193e-05, 6.765127182006836e-05, 7.034838199615479e-05, 7.304549217224121e-05, 7.574260234832764e-05, 7.843971252441406e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 1.0, 10.0, 6.0, 13.0, 9.0, 16.0, 12.0, 13.0, 15.0, 31.0, 25.0, 21.0, 26.0, 37.0, 35.0, 37.0, 43.0, 46.0, 28.0, 52.0, 45.0, 41.0, 48.0, 39.0, 37.0, 44.0, 33.0, 30.0, 35.0, 27.0, 20.0, 22.0, 19.0, 16.0, 14.0, 8.0, 7.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5255889892578125, -1.479888916015625, -1.4341888427734375, -1.38848876953125, -1.3427886962890625, -1.297088623046875, -1.2513885498046875, -1.2056884765625, -1.1599884033203125, -1.114288330078125, -1.0685882568359375, -1.02288818359375, -0.9771881103515625, -0.931488037109375, -0.8857879638671875, -0.840087890625, -0.7943878173828125, -0.748687744140625, -0.7029876708984375, -0.65728759765625, -0.6115875244140625, -0.565887451171875, -0.5201873779296875, -0.4744873046875, -0.4287872314453125, -0.383087158203125, -0.3373870849609375, -0.29168701171875, -0.2459869384765625, -0.200286865234375, -0.1545867919921875, -0.10888671875, -0.0631866455078125, -0.017486572265625, 0.0282135009765625, 0.07391357421875, 0.1196136474609375, 0.165313720703125, 0.2110137939453125, 0.2567138671875, 0.3024139404296875, 0.348114013671875, 0.3938140869140625, 0.43951416015625, 0.4852142333984375, 0.530914306640625, 0.5766143798828125, 0.622314453125, 0.6680145263671875, 0.713714599609375, 0.7594146728515625, 0.80511474609375, 0.8508148193359375, 0.896514892578125, 0.9422149658203125, 0.9879150390625, 1.0336151123046875, 1.079315185546875, 1.1250152587890625, 1.17071533203125, 1.2164154052734375, 1.262115478515625, 1.3078155517578125, 1.353515625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 7.0, 8.0, 15.0, 15.0, 15.0, 36.0, 41.0, 56.0, 84.0, 93.0, 117.0, 144.0, 237.0, 312.0, 386.0, 677.0, 1065.0, 1561.0, 2738.0, 4788.0, 8808.0, 17480.0, 36762.0, 86699.0, 216883.0, 357714.0, 176669.0, 70469.0, 30908.0, 15003.0, 7761.0, 4166.0, 2349.0, 1490.0, 926.0, 592.0, 405.0, 283.0, 205.0, 151.0, 107.0, 86.0, 67.0, 45.0, 39.0, 26.0, 18.0, 16.0, 11.0, 8.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4716796875, -1.426239013671875, -1.38079833984375, -1.335357666015625, -1.2899169921875, -1.244476318359375, -1.19903564453125, -1.153594970703125, -1.108154296875, -1.062713623046875, -1.01727294921875, -0.971832275390625, -0.9263916015625, -0.880950927734375, -0.83551025390625, -0.790069580078125, -0.74462890625, -0.699188232421875, -0.65374755859375, -0.608306884765625, -0.5628662109375, -0.517425537109375, -0.47198486328125, -0.426544189453125, -0.381103515625, -0.335662841796875, -0.29022216796875, -0.244781494140625, -0.1993408203125, -0.153900146484375, -0.10845947265625, -0.063018798828125, -0.017578125, 0.027862548828125, 0.07330322265625, 0.118743896484375, 0.1641845703125, 0.209625244140625, 0.25506591796875, 0.300506591796875, 0.345947265625, 0.391387939453125, 0.43682861328125, 0.482269287109375, 0.5277099609375, 0.573150634765625, 0.61859130859375, 0.664031982421875, 0.70947265625, 0.754913330078125, 0.80035400390625, 0.845794677734375, 0.8912353515625, 0.936676025390625, 0.98211669921875, 1.027557373046875, 1.072998046875, 1.118438720703125, 1.16387939453125, 1.209320068359375, 1.2547607421875, 1.300201416015625, 1.34564208984375, 1.391082763671875, 1.4365234375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 7.0, 2.0, 12.0, 9.0, 12.0, 17.0, 13.0, 26.0, 19.0, 20.0, 35.0, 30.0, 32.0, 40.0, 40.0, 42.0, 60.0, 77.0, 220.0, 1505.0, 288.0, 102.0, 59.0, 59.0, 30.0, 28.0, 40.0, 29.0, 30.0, 25.0, 25.0, 19.0, 21.0, 12.0, 13.0, 7.0, 5.0, 8.0, 6.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76275634765625, -4.6075439453125, -4.45233154296875, -4.297119140625, -4.14190673828125, -3.9866943359375, -3.83148193359375, -3.67626953125, -3.52105712890625, -3.3658447265625, -3.21063232421875, -3.055419921875, -2.90020751953125, -2.7449951171875, -2.58978271484375, -2.4345703125, -2.27935791015625, -2.1241455078125, -1.96893310546875, -1.813720703125, -1.65850830078125, -1.5032958984375, -1.34808349609375, -1.19287109375, -1.03765869140625, -0.8824462890625, -0.72723388671875, -0.572021484375, -0.41680908203125, -0.2615966796875, -0.10638427734375, 0.048828125, 0.20404052734375, 0.3592529296875, 0.51446533203125, 0.669677734375, 0.82489013671875, 0.9801025390625, 1.13531494140625, 1.29052734375, 1.44573974609375, 1.6009521484375, 1.75616455078125, 1.911376953125, 2.06658935546875, 2.2218017578125, 2.37701416015625, 2.5322265625, 2.68743896484375, 2.8426513671875, 2.99786376953125, 3.153076171875, 3.30828857421875, 3.4635009765625, 3.61871337890625, 3.77392578125, 3.92913818359375, 4.0843505859375, 4.23956298828125, 4.394775390625, 4.54998779296875, 4.7052001953125, 4.86041259765625, 5.015625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 8.0, 9.0, 11.0, 9.0, 16.0, 23.0, 29.0, 30.0, 36.0, 51.0, 83.0, 98.0, 156.0, 293.0, 687.0, 2709.0, 42081.0, 2906076.0, 185113.0, 6097.0, 1011.0, 330.0, 198.0, 147.0, 97.0, 67.0, 47.0, 27.0, 37.0, 25.0, 23.0, 20.0, 8.0, 8.0, 5.0, 9.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.1640625, -9.879150390625, -9.59423828125, -9.309326171875, -9.0244140625, -8.739501953125, -8.45458984375, -8.169677734375, -7.884765625, -7.599853515625, -7.31494140625, -7.030029296875, -6.7451171875, -6.460205078125, -6.17529296875, -5.890380859375, -5.60546875, -5.320556640625, -5.03564453125, -4.750732421875, -4.4658203125, -4.180908203125, -3.89599609375, -3.611083984375, -3.326171875, -3.041259765625, -2.75634765625, -2.471435546875, -2.1865234375, -1.901611328125, -1.61669921875, -1.331787109375, -1.046875, -0.761962890625, -0.47705078125, -0.192138671875, 0.0927734375, 0.377685546875, 0.66259765625, 0.947509765625, 1.232421875, 1.517333984375, 1.80224609375, 2.087158203125, 2.3720703125, 2.656982421875, 2.94189453125, 3.226806640625, 3.51171875, 3.796630859375, 4.08154296875, 4.366455078125, 4.6513671875, 4.936279296875, 5.22119140625, 5.506103515625, 5.791015625, 6.075927734375, 6.36083984375, 6.645751953125, 6.9306640625, 7.215576171875, 7.50048828125, 7.785400390625, 8.0703125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 20.0, 135.0, 366.0, 348.0, 122.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.35190200805664, -14.58341121673584, -13.814920425415039, -13.046428680419922, -12.277938842773438, -11.50944709777832, -10.74095630645752, -9.972465515136719, -9.203974723815918, -8.435483932495117, -7.666993141174316, -6.898501873016357, -6.130011081695557, -5.361520290374756, -4.593029022216797, -3.824538230895996, -3.0560474395751953, -2.2875566482543945, -1.5190656185150146, -0.7505745887756348, 0.017916202545166016, 0.7864069938659668, 1.5548982620239258, 2.3233890533447266, 3.0918798446655273, 3.860370635986328, 4.628861427307129, 5.397352695465088, 6.165843486785889, 6.9343342781066895, 7.702825546264648, 8.47131633758545, 9.23980712890625, 10.00829792022705, 10.776788711547852, 11.545280456542969, 12.313770294189453, 13.08226203918457, 13.850752830505371, 14.619243621826172, 15.387734413146973, 16.156225204467773, 16.92471694946289, 17.693206787109375, 18.461698532104492, 19.230188369750977, 19.998680114746094, 20.767169952392578, 21.535661697387695, 22.304153442382812, 23.072643280029297, 23.841135025024414, 24.6096248626709, 25.378116607666016, 26.1466064453125, 26.915098190307617, 27.683589935302734, 28.45208168029785, 29.220571517944336, 29.989063262939453, 30.757553100585938, 31.526044845581055, 32.29453659057617, 33.063026428222656, 33.83151626586914]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 7.0, 18.0, 20.0, 15.0, 21.0, 23.0, 32.0, 18.0, 33.0, 38.0, 26.0, 46.0, 41.0, 35.0, 44.0, 34.0, 49.0, 57.0, 42.0, 30.0, 29.0, 33.0, 29.0, 37.0, 37.0, 31.0, 20.0, 19.0, 22.0, 14.0, 11.0, 9.0, 12.0, 11.0, 6.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.569936752319336, -17.070125579833984, -16.5703125, -16.07050132751465, -15.57068920135498, -15.070877075195312, -14.571064949035645, -14.071252822875977, -13.571441650390625, -13.071629524230957, -12.571817398071289, -12.072006225585938, -11.57219409942627, -11.072381973266602, -10.572569847106934, -10.072757720947266, -9.572946548461914, -9.073134422302246, -8.573322296142578, -8.073511123657227, -7.573698997497559, -7.073886871337891, -6.574074745178223, -6.074263095855713, -5.574450492858887, -5.074638366699219, -4.574826717376709, -4.075014591217041, -3.5752029418945312, -3.0753908157348633, -2.5755789279937744, -2.0757670402526855, -1.5759553909301758, -1.076143503189087, -0.5763315558433533, -0.07651960849761963, 0.42329227924346924, 0.9231042861938477, 1.4229161739349365, 1.9227280616760254, 2.4225399494171143, 2.922351837158203, 3.422163724899292, 3.921975612640381, 4.421787738800049, 4.921599388122559, 5.421411514282227, 5.9212236404418945, 6.421035289764404, 6.920847415924072, 7.420659065246582, 7.92047119140625, 8.420283317565918, 8.920095443725586, 9.419906616210938, 9.919718742370605, 10.419530868530273, 10.919342994689941, 11.41915512084961, 11.918966293334961, 12.418778419494629, 12.918590545654297, 13.418402671813965, 13.918214797973633, 14.418025970458984]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 11.0, 12.0, 15.0, 8.0, 15.0, 17.0, 16.0, 19.0, 20.0, 19.0, 27.0, 29.0, 39.0, 35.0, 35.0, 39.0, 34.0, 41.0, 48.0, 51.0, 35.0, 41.0, 35.0, 44.0, 36.0, 32.0, 36.0, 31.0, 20.0, 29.0, 24.0, 11.0, 19.0, 19.0, 5.0, 8.0, 9.0, 7.0, 5.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6611328125, -1.6137237548828125, -1.566314697265625, -1.5189056396484375, -1.47149658203125, -1.4240875244140625, -1.376678466796875, -1.3292694091796875, -1.2818603515625, -1.2344512939453125, -1.187042236328125, -1.1396331787109375, -1.09222412109375, -1.0448150634765625, -0.997406005859375, -0.9499969482421875, -0.902587890625, -0.8551788330078125, -0.807769775390625, -0.7603607177734375, -0.71295166015625, -0.6655426025390625, -0.618133544921875, -0.5707244873046875, -0.5233154296875, -0.4759063720703125, -0.428497314453125, -0.3810882568359375, -0.33367919921875, -0.2862701416015625, -0.238861083984375, -0.1914520263671875, -0.14404296875, -0.0966339111328125, -0.049224853515625, -0.0018157958984375, 0.04559326171875, 0.0930023193359375, 0.140411376953125, 0.1878204345703125, 0.2352294921875, 0.2826385498046875, 0.330047607421875, 0.3774566650390625, 0.42486572265625, 0.4722747802734375, 0.519683837890625, 0.5670928955078125, 0.614501953125, 0.6619110107421875, 0.709320068359375, 0.7567291259765625, 0.80413818359375, 0.8515472412109375, 0.898956298828125, 0.9463653564453125, 0.9937744140625, 1.0411834716796875, 1.088592529296875, 1.1360015869140625, 1.18341064453125, 1.2308197021484375, 1.278228759765625, 1.3256378173828125, 1.373046875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 8.0, 12.0, 19.0, 13.0, 14.0, 16.0, 11.0, 13.0, 27.0, 20.0, 35.0, 49.0, 69.0, 136.0, 369.0, 1585.0, 11554.0, 330566.0, 3574222.0, 262910.0, 10400.0, 1398.0, 357.0, 125.0, 50.0, 32.0, 37.0, 37.0, 28.0, 18.0, 27.0, 15.0, 15.0, 14.0, 14.0, 10.0, 5.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-7.87109375, -7.64276123046875, -7.4144287109375, -7.18609619140625, -6.957763671875, -6.72943115234375, -6.5010986328125, -6.27276611328125, -6.04443359375, -5.81610107421875, -5.5877685546875, -5.35943603515625, -5.131103515625, -4.90277099609375, -4.6744384765625, -4.44610595703125, -4.2177734375, -3.98944091796875, -3.7611083984375, -3.53277587890625, -3.304443359375, -3.07611083984375, -2.8477783203125, -2.61944580078125, -2.39111328125, -2.16278076171875, -1.9344482421875, -1.70611572265625, -1.477783203125, -1.24945068359375, -1.0211181640625, -0.79278564453125, -0.564453125, -0.33612060546875, -0.1077880859375, 0.12054443359375, 0.348876953125, 0.57720947265625, 0.8055419921875, 1.03387451171875, 1.26220703125, 1.49053955078125, 1.7188720703125, 1.94720458984375, 2.175537109375, 2.40386962890625, 2.6322021484375, 2.86053466796875, 3.0888671875, 3.31719970703125, 3.5455322265625, 3.77386474609375, 4.002197265625, 4.23052978515625, 4.4588623046875, 4.68719482421875, 4.91552734375, 5.14385986328125, 5.3721923828125, 5.60052490234375, 5.828857421875, 6.05718994140625, 6.2855224609375, 6.51385498046875, 6.7421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 6.0, 15.0, 16.0, 30.0, 28.0, 45.0, 57.0, 82.0, 123.0, 174.0, 239.0, 286.0, 395.0, 487.0, 452.0, 392.0, 329.0, 262.0, 168.0, 132.0, 89.0, 63.0, 45.0, 36.0, 19.0, 27.0, 25.0, 10.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.138763427734375, -5.00018310546875, -4.861602783203125, -4.7230224609375, -4.584442138671875, -4.44586181640625, -4.307281494140625, -4.168701171875, -4.030120849609375, -3.89154052734375, -3.752960205078125, -3.6143798828125, -3.475799560546875, -3.33721923828125, -3.198638916015625, -3.06005859375, -2.921478271484375, -2.78289794921875, -2.644317626953125, -2.5057373046875, -2.367156982421875, -2.22857666015625, -2.089996337890625, -1.951416015625, -1.812835693359375, -1.67425537109375, -1.535675048828125, -1.3970947265625, -1.258514404296875, -1.11993408203125, -0.981353759765625, -0.8427734375, -0.704193115234375, -0.56561279296875, -0.427032470703125, -0.2884521484375, -0.149871826171875, -0.01129150390625, 0.127288818359375, 0.265869140625, 0.404449462890625, 0.54302978515625, 0.681610107421875, 0.8201904296875, 0.958770751953125, 1.09735107421875, 1.235931396484375, 1.37451171875, 1.513092041015625, 1.65167236328125, 1.790252685546875, 1.9288330078125, 2.067413330078125, 2.20599365234375, 2.344573974609375, 2.483154296875, 2.621734619140625, 2.76031494140625, 2.898895263671875, 3.0374755859375, 3.176055908203125, 3.31463623046875, 3.453216552734375, 3.591796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 18.0, 30.0, 30.0, 49.0, 42.0, 87.0, 125.0, 175.0, 289.0, 689.0, 2296.0, 16871.0, 521574.0, 3496196.0, 145684.0, 7594.0, 1375.0, 439.0, 243.0, 136.0, 91.0, 59.0, 43.0, 32.0, 26.0, 13.0, 12.0, 5.0, 10.0, 7.0, 4.0, 6.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.166259765625, -10.78564453125, -10.405029296875, -10.0244140625, -9.643798828125, -9.26318359375, -8.882568359375, -8.501953125, -8.121337890625, -7.74072265625, -7.360107421875, -6.9794921875, -6.598876953125, -6.21826171875, -5.837646484375, -5.45703125, -5.076416015625, -4.69580078125, -4.315185546875, -3.9345703125, -3.553955078125, -3.17333984375, -2.792724609375, -2.412109375, -2.031494140625, -1.65087890625, -1.270263671875, -0.8896484375, -0.509033203125, -0.12841796875, 0.252197265625, 0.6328125, 1.013427734375, 1.39404296875, 1.774658203125, 2.1552734375, 2.535888671875, 2.91650390625, 3.297119140625, 3.677734375, 4.058349609375, 4.43896484375, 4.819580078125, 5.2001953125, 5.580810546875, 5.96142578125, 6.342041015625, 6.72265625, 7.103271484375, 7.48388671875, 7.864501953125, 8.2451171875, 8.625732421875, 9.00634765625, 9.386962890625, 9.767578125, 10.148193359375, 10.52880859375, 10.909423828125, 11.2900390625, 11.670654296875, 12.05126953125, 12.431884765625, 12.8125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 14.0, 35.0, 38.0, 64.0, 90.0, 103.0, 111.0, 114.0, 101.0, 113.0, 81.0, 56.0, 31.0, 15.0, 18.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.88625717163086, -26.293231964111328, -25.700204849243164, -25.107179641723633, -24.51415252685547, -23.921127319335938, -23.328102111816406, -22.735076904296875, -22.14204978942871, -21.54902458190918, -20.955997467041016, -20.362972259521484, -19.769947052001953, -19.17691993713379, -18.583894729614258, -17.990867614746094, -17.397842407226562, -16.80481719970703, -16.211790084838867, -15.618764877319336, -15.025738716125488, -14.43271255493164, -13.83968734741211, -13.246661186218262, -12.653635025024414, -12.060608863830566, -11.467582702636719, -10.874557495117188, -10.28153133392334, -9.688505172729492, -9.095479965209961, -8.502453804016113, -7.909427642822266, -7.316401481628418, -6.7233757972717285, -6.130350112915039, -5.537323951721191, -4.944297790527344, -4.351272106170654, -3.758246421813965, -3.165220260620117, -2.5721943378448486, -1.97916841506958, -1.3861424922943115, -0.793116569519043, -0.20009064674377441, 0.39293527603149414, 0.9859609603881836, 1.5789871215820312, 2.1720130443573, 2.7650389671325684, 3.358064889907837, 3.9510908126831055, 4.544116973876953, 5.137142658233643, 5.730168342590332, 6.32319450378418, 6.916220664978027, 7.509246349334717, 8.102272033691406, 8.695298194885254, 9.288324356079102, 9.881349563598633, 10.47437572479248, 11.067401885986328]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 8.0, 7.0, 9.0, 15.0, 16.0, 15.0, 17.0, 13.0, 23.0, 29.0, 24.0, 13.0, 34.0, 33.0, 36.0, 34.0, 40.0, 38.0, 43.0, 40.0, 44.0, 40.0, 39.0, 38.0, 36.0, 36.0, 33.0, 34.0, 23.0, 24.0, 23.0, 25.0, 13.0, 12.0, 20.0, 10.0, 8.0, 14.0, 9.0, 10.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.997387886047363, -13.576021194458008, -13.154654502868652, -12.733287811279297, -12.311921119689941, -11.890554428100586, -11.46918773651123, -11.047821044921875, -10.62645435333252, -10.205087661743164, -9.783720970153809, -9.362354278564453, -8.940987586975098, -8.519620895385742, -8.098254203796387, -7.676887512207031, -7.255520820617676, -6.83415412902832, -6.412787437438965, -5.991420745849609, -5.570054054260254, -5.148687362670898, -4.727320671081543, -4.3059539794921875, -3.884587287902832, -3.4632205963134766, -3.041853904724121, -2.6204872131347656, -2.19912052154541, -1.7777538299560547, -1.3563871383666992, -0.9350204467773438, -0.5136528015136719, -0.0922861099243164, 0.32908058166503906, 0.7504472732543945, 1.17181396484375, 1.5931806564331055, 2.014547348022461, 2.4359140396118164, 2.857280731201172, 3.2786474227905273, 3.700014114379883, 4.121380805969238, 4.542747497558594, 4.964114189147949, 5.385480880737305, 5.80684757232666, 6.228214263916016, 6.649580955505371, 7.070947647094727, 7.492314338684082, 7.9136810302734375, 8.335047721862793, 8.756414413452148, 9.177781105041504, 9.59914779663086, 10.020514488220215, 10.44188117980957, 10.863247871398926, 11.284614562988281, 11.705981254577637, 12.127347946166992, 12.548714637756348, 12.970081329345703]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 12.0, 11.0, 12.0, 14.0, 21.0, 19.0, 22.0, 23.0, 24.0, 29.0, 37.0, 44.0, 42.0, 41.0, 56.0, 50.0, 41.0, 36.0, 36.0, 37.0, 36.0, 32.0, 30.0, 31.0, 36.0, 26.0, 19.0, 24.0, 16.0, 22.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.48046875, -1.432861328125, -1.38525390625, -1.337646484375, -1.2900390625, -1.242431640625, -1.19482421875, -1.147216796875, -1.099609375, -1.052001953125, -1.00439453125, -0.956787109375, -0.9091796875, -0.861572265625, -0.81396484375, -0.766357421875, -0.71875, -0.671142578125, -0.62353515625, -0.575927734375, -0.5283203125, -0.480712890625, -0.43310546875, -0.385498046875, -0.337890625, -0.290283203125, -0.24267578125, -0.195068359375, -0.1474609375, -0.099853515625, -0.05224609375, -0.004638671875, 0.04296875, 0.090576171875, 0.13818359375, 0.185791015625, 0.2333984375, 0.281005859375, 0.32861328125, 0.376220703125, 0.423828125, 0.471435546875, 0.51904296875, 0.566650390625, 0.6142578125, 0.661865234375, 0.70947265625, 0.757080078125, 0.8046875, 0.852294921875, 0.89990234375, 0.947509765625, 0.9951171875, 1.042724609375, 1.09033203125, 1.137939453125, 1.185546875, 1.233154296875, 1.28076171875, 1.328369140625, 1.3759765625, 1.423583984375, 1.47119140625, 1.518798828125, 1.56640625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 4.0, 2.0, 1.0, 7.0, 12.0, 24.0, 36.0, 53.0, 53.0, 81.0, 104.0, 204.0, 262.0, 357.0, 471.0, 791.0, 1041.0, 1410.0, 2155.0, 2995.0, 4470.0, 6467.0, 9337.0, 13712.0, 19804.0, 30293.0, 47804.0, 79826.0, 151319.0, 284248.0, 160944.0, 82863.0, 49716.0, 31570.0, 21018.0, 14095.0, 9522.0, 6596.0, 4553.0, 3095.0, 2191.0, 1494.0, 1028.0, 774.0, 527.0, 354.0, 263.0, 202.0, 135.0, 86.0, 46.0, 51.0, 37.0, 24.0, 12.0, 7.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.251220703125, -0.243255615234375, -0.23529052734375, -0.227325439453125, -0.2193603515625, -0.211395263671875, -0.20343017578125, -0.195465087890625, -0.1875, -0.179534912109375, -0.17156982421875, -0.163604736328125, -0.1556396484375, -0.147674560546875, -0.13970947265625, -0.131744384765625, -0.123779296875, -0.115814208984375, -0.10784912109375, -0.099884033203125, -0.0919189453125, -0.083953857421875, -0.07598876953125, -0.068023681640625, -0.06005859375, -0.052093505859375, -0.04412841796875, -0.036163330078125, -0.0281982421875, -0.020233154296875, -0.01226806640625, -0.004302978515625, 0.003662109375, 0.011627197265625, 0.01959228515625, 0.027557373046875, 0.0355224609375, 0.043487548828125, 0.05145263671875, 0.059417724609375, 0.0673828125, 0.075347900390625, 0.08331298828125, 0.091278076171875, 0.0992431640625, 0.107208251953125, 0.11517333984375, 0.123138427734375, 0.131103515625, 0.139068603515625, 0.14703369140625, 0.154998779296875, 0.1629638671875, 0.170928955078125, 0.17889404296875, 0.186859130859375, 0.19482421875, 0.202789306640625, 0.21075439453125, 0.218719482421875, 0.2266845703125, 0.234649658203125, 0.24261474609375, 0.250579833984375, 0.258544921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 8.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 11.0, 11.0, 13.0, 12.0, 10.0, 20.0, 36.0, 21.0, 28.0, 34.0, 31.0, 34.0, 41.0, 38.0, 35.0, 31.0, 40.0, 45.0, 1062.0, 30.0, 29.0, 36.0, 35.0, 26.0, 25.0, 30.0, 34.0, 27.0, 33.0, 20.0, 18.0, 16.0, 19.0, 13.0, 10.0, 5.0, 7.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8505859375, -0.821502685546875, -0.79241943359375, -0.763336181640625, -0.7342529296875, -0.705169677734375, -0.67608642578125, -0.647003173828125, -0.617919921875, -0.588836669921875, -0.55975341796875, -0.530670166015625, -0.5015869140625, -0.472503662109375, -0.44342041015625, -0.414337158203125, -0.38525390625, -0.356170654296875, -0.32708740234375, -0.298004150390625, -0.2689208984375, -0.239837646484375, -0.21075439453125, -0.181671142578125, -0.152587890625, -0.123504638671875, -0.09442138671875, -0.065338134765625, -0.0362548828125, -0.007171630859375, 0.02191162109375, 0.050994873046875, 0.080078125, 0.109161376953125, 0.13824462890625, 0.167327880859375, 0.1964111328125, 0.225494384765625, 0.25457763671875, 0.283660888671875, 0.312744140625, 0.341827392578125, 0.37091064453125, 0.399993896484375, 0.4290771484375, 0.458160400390625, 0.48724365234375, 0.516326904296875, 0.54541015625, 0.574493408203125, 0.60357666015625, 0.632659912109375, 0.6617431640625, 0.690826416015625, 0.71990966796875, 0.748992919921875, 0.778076171875, 0.807159423828125, 0.83624267578125, 0.865325927734375, 0.8944091796875, 0.923492431640625, 0.95257568359375, 0.981658935546875, 1.0107421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 9.0, 9.0, 13.0, 17.0, 31.0, 51.0, 81.0, 122.0, 211.0, 275.0, 388.0, 597.0, 874.0, 1207.0, 1760.0, 2634.0, 3800.0, 5842.0, 8817.0, 13471.0, 20994.0, 32780.0, 54578.0, 94291.0, 186839.0, 1331382.0, 136924.0, 75695.0, 44536.0, 27501.0, 17494.0, 11323.0, 7310.0, 4874.0, 3359.0, 2299.0, 1469.0, 1062.0, 763.0, 459.0, 345.0, 195.0, 164.0, 105.0, 59.0, 49.0, 31.0, 17.0, 14.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24951171875, -0.24127578735351562, -0.23303985595703125, -0.22480392456054688, -0.2165679931640625, -0.20833206176757812, -0.20009613037109375, -0.19186019897460938, -0.183624267578125, -0.17538833618164062, -0.16715240478515625, -0.15891647338867188, -0.1506805419921875, -0.14244461059570312, -0.13420867919921875, -0.12597274780273438, -0.11773681640625, -0.10950088500976562, -0.10126495361328125, -0.09302902221679688, -0.0847930908203125, -0.07655715942382812, -0.06832122802734375, -0.060085296630859375, -0.051849365234375, -0.043613433837890625, -0.03537750244140625, -0.027141571044921875, -0.0189056396484375, -0.010669708251953125, -0.00243377685546875, 0.005802154541015625, 0.0140380859375, 0.022274017333984375, 0.03050994873046875, 0.038745880126953125, 0.0469818115234375, 0.055217742919921875, 0.06345367431640625, 0.07168960571289062, 0.079925537109375, 0.08816146850585938, 0.09639739990234375, 0.10463333129882812, 0.1128692626953125, 0.12110519409179688, 0.12934112548828125, 0.13757705688476562, 0.14581298828125, 0.15404891967773438, 0.16228485107421875, 0.17052078247070312, 0.1787567138671875, 0.18699264526367188, 0.19522857666015625, 0.20346450805664062, 0.211700439453125, 0.21993637084960938, 0.22817230224609375, 0.23640823364257812, 0.2446441650390625, 0.2528800964355469, 0.26111602783203125, 0.2693519592285156, 0.277587890625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 7.0, 11.0, 11.0, 11.0, 10.0, 19.0, 14.0, 30.0, 31.0, 36.0, 53.0, 42.0, 37.0, 48.0, 63.0, 49.0, 46.0, 41.0, 39.0, 46.0, 49.0, 46.0, 37.0, 36.0, 29.0, 25.0, 18.0, 17.0, 18.0, 13.0, 12.0, 8.0, 9.0, 9.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.00016367435455322266, -0.00015834160149097443, -0.0001530088484287262, -0.00014767609536647797, -0.00014234334230422974, -0.0001370105892419815, -0.00013167783617973328, -0.00012634508311748505, -0.00012101233005523682, -0.00011567957699298859, -0.00011034682393074036, -0.00010501407086849213, -9.96813178062439e-05, -9.434856474399567e-05, -8.901581168174744e-05, -8.36830586194992e-05, -7.835030555725098e-05, -7.301755249500275e-05, -6.768479943275452e-05, -6.235204637050629e-05, -5.701929330825806e-05, -5.168654024600983e-05, -4.63537871837616e-05, -4.102103412151337e-05, -3.568828105926514e-05, -3.0355527997016907e-05, -2.5022774934768677e-05, -1.9690021872520447e-05, -1.4357268810272217e-05, -9.024515748023987e-06, -3.691762685775757e-06, 1.6409903764724731e-06, 6.973743438720703e-06, 1.2306496500968933e-05, 1.7639249563217163e-05, 2.2972002625465393e-05, 2.8304755687713623e-05, 3.363750874996185e-05, 3.897026181221008e-05, 4.430301487445831e-05, 4.963576793670654e-05, 5.496852099895477e-05, 6.0301274061203e-05, 6.563402712345123e-05, 7.096678018569946e-05, 7.629953324794769e-05, 8.163228631019592e-05, 8.696503937244415e-05, 9.229779243469238e-05, 9.763054549694061e-05, 0.00010296329855918884, 0.00010829605162143707, 0.0001136288046836853, 0.00011896155774593353, 0.00012429431080818176, 0.00012962706387043, 0.00013495981693267822, 0.00014029256999492645, 0.00014562532305717468, 0.0001509580761194229, 0.00015629082918167114, 0.00016162358224391937, 0.0001669563353061676, 0.00017228908836841583, 0.00017762184143066406]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 11.0, 9.0, 12.0, 23.0, 18.0, 25.0, 41.0, 45.0, 57.0, 71.0, 106.0, 109.0, 167.0, 275.0, 324.0, 613.0, 3339.0, 942681.0, 97947.0, 1150.0, 443.0, 254.0, 208.0, 116.0, 120.0, 93.0, 86.0, 54.0, 34.0, 31.0, 11.0, 13.0, 17.0, 10.0, 7.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0031909942626953125, -0.00308382511138916, -0.002976655960083008, -0.0028694868087768555, -0.002762317657470703, -0.0026551485061645508, -0.0025479793548583984, -0.002440810203552246, -0.0023336410522460938, -0.0022264719009399414, -0.002119302749633789, -0.0020121335983276367, -0.0019049644470214844, -0.001797795295715332, -0.0016906261444091797, -0.0015834569931030273, -0.001476287841796875, -0.0013691186904907227, -0.0012619495391845703, -0.001154780387878418, -0.0010476112365722656, -0.0009404420852661133, -0.0008332729339599609, -0.0007261037826538086, -0.0006189346313476562, -0.0005117654800415039, -0.00040459632873535156, -0.0002974271774291992, -0.00019025802612304688, -8.308887481689453e-05, 2.4080276489257812e-05, 0.00013124942779541016, 0.0002384185791015625, 0.00034558773040771484, 0.0004527568817138672, 0.0005599260330200195, 0.0006670951843261719, 0.0007742643356323242, 0.0008814334869384766, 0.000988602638244629, 0.0010957717895507812, 0.0012029409408569336, 0.001310110092163086, 0.0014172792434692383, 0.0015244483947753906, 0.001631617546081543, 0.0017387866973876953, 0.0018459558486938477, 0.001953125, 0.0020602941513061523, 0.0021674633026123047, 0.002274632453918457, 0.0023818016052246094, 0.0024889707565307617, 0.002596139907836914, 0.0027033090591430664, 0.0028104782104492188, 0.002917647361755371, 0.0030248165130615234, 0.0031319856643676758, 0.003239154815673828, 0.0033463239669799805, 0.003453493118286133, 0.003560662269592285, 0.0036678314208984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 119.0, 523.0, 309.0, 49.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010006871307268739, -0.000982757075689733, -0.0009648269042372704, -0.0009468968492001295, -0.0009289667359553277, -0.000911036622710526, -0.0008931065676733851, -0.0008751764544285834, -0.0008572463411837816, -0.0008393162279389799, -0.0008213861146941781, -0.0008034560596570373, -0.0007855259464122355, -0.0007675958331674337, -0.0007496657781302929, -0.0007317356648854911, -0.0007138055516406894, -0.0006958754383958876, -0.0006779453251510859, -0.000660015270113945, -0.0006420851568691432, -0.0006241550436243415, -0.0006062249885872006, -0.0005882948753423989, -0.0005703647620975971, -0.0005524346488527954, -0.0005345045356079936, -0.0005165744805708528, -0.000498644367326051, -0.00048071425408124924, -0.00046278416994027793, -0.00044485408579930663, -0.00042692391434684396, -0.0004089938011020422, -0.0003910637169610709, -0.0003731336328200996, -0.00035520351957529783, -0.00033727340633049607, -0.00031934332218952477, -0.00030141323804855347, -0.0002834831248037517, -0.00026555301155894995, -0.00024762292741797864, -0.0002296928287250921, -0.00021176273003220558, -0.00019383263133931905, -0.00017590253264643252, -0.000157972433953546, -0.00014004234981257468, -0.00012211225111968815, -0.00010418215242680162, -8.625205373391509e-05, -6.832195504102856e-05, -5.039185634814203e-05, -3.2461757655255497e-05, -1.4531658962368965e-05, 3.398439730517566e-06, 2.1328538423404098e-05, 3.925863711629063e-05, 5.718873580917716e-05, 7.511883450206369e-05, 9.304893319495022e-05, 0.00011097903188783675, 0.00012890913058072329, 0.00014683922927360982]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 12.0, 12.0, 11.0, 14.0, 19.0, 19.0, 23.0, 41.0, 20.0, 22.0, 32.0, 35.0, 29.0, 38.0, 35.0, 50.0, 45.0, 35.0, 48.0, 44.0, 42.0, 37.0, 37.0, 41.0, 33.0, 20.0, 27.0, 26.0, 24.0, 19.0, 19.0, 19.0, 10.0, 1.0, 14.0, 8.0, 2.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0], "bins": [-0.00011289119720458984, -0.00010976940393447876, -0.00010664761066436768, -0.00010352581739425659, -0.00010040402412414551, -9.728223085403442e-05, -9.416043758392334e-05, -9.103864431381226e-05, -8.791685104370117e-05, -8.479505777359009e-05, -8.1673264503479e-05, -7.855147123336792e-05, -7.542967796325684e-05, -7.230788469314575e-05, -6.918609142303467e-05, -6.606429815292358e-05, -6.29425048828125e-05, -5.9820711612701416e-05, -5.669891834259033e-05, -5.357712507247925e-05, -5.0455331802368164e-05, -4.733353853225708e-05, -4.4211745262145996e-05, -4.108995199203491e-05, -3.796815872192383e-05, -3.4846365451812744e-05, -3.172457218170166e-05, -2.8602778911590576e-05, -2.5480985641479492e-05, -2.2359192371368408e-05, -1.9237399101257324e-05, -1.611560583114624e-05, -1.2993812561035156e-05, -9.872019290924072e-06, -6.750226020812988e-06, -3.6284327507019043e-06, -5.066394805908203e-07, 2.6151537895202637e-06, 5.736947059631348e-06, 8.858740329742432e-06, 1.1980533599853516e-05, 1.51023268699646e-05, 1.8224120140075684e-05, 2.1345913410186768e-05, 2.446770668029785e-05, 2.7589499950408936e-05, 3.071129322052002e-05, 3.3833086490631104e-05, 3.695487976074219e-05, 4.007667303085327e-05, 4.3198466300964355e-05, 4.632025957107544e-05, 4.9442052841186523e-05, 5.256384611129761e-05, 5.568563938140869e-05, 5.8807432651519775e-05, 6.192922592163086e-05, 6.505101919174194e-05, 6.817281246185303e-05, 7.129460573196411e-05, 7.44163990020752e-05, 7.753819227218628e-05, 8.065998554229736e-05, 8.378177881240845e-05, 8.690357208251953e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 12.0, 11.0, 12.0, 14.0, 21.0, 19.0, 22.0, 23.0, 24.0, 29.0, 37.0, 44.0, 42.0, 41.0, 56.0, 50.0, 41.0, 36.0, 36.0, 37.0, 36.0, 32.0, 30.0, 31.0, 36.0, 26.0, 19.0, 24.0, 16.0, 22.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.48046875, -1.432861328125, -1.38525390625, -1.337646484375, -1.2900390625, -1.242431640625, -1.19482421875, -1.147216796875, -1.099609375, -1.052001953125, -1.00439453125, -0.956787109375, -0.9091796875, -0.861572265625, -0.81396484375, -0.766357421875, -0.71875, -0.671142578125, -0.62353515625, -0.575927734375, -0.5283203125, -0.480712890625, -0.43310546875, -0.385498046875, -0.337890625, -0.290283203125, -0.24267578125, -0.195068359375, -0.1474609375, -0.099853515625, -0.05224609375, -0.004638671875, 0.04296875, 0.090576171875, 0.13818359375, 0.185791015625, 0.2333984375, 0.281005859375, 0.32861328125, 0.376220703125, 0.423828125, 0.471435546875, 0.51904296875, 0.566650390625, 0.6142578125, 0.661865234375, 0.70947265625, 0.757080078125, 0.8046875, 0.852294921875, 0.89990234375, 0.947509765625, 0.9951171875, 1.042724609375, 1.09033203125, 1.137939453125, 1.185546875, 1.233154296875, 1.28076171875, 1.328369140625, 1.3759765625, 1.423583984375, 1.47119140625, 1.518798828125, 1.56640625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 7.0, 5.0, 12.0, 10.0, 16.0, 30.0, 32.0, 38.0, 55.0, 95.0, 98.0, 154.0, 207.0, 337.0, 478.0, 789.0, 1611.0, 3246.0, 7989.0, 24446.0, 97705.0, 381692.0, 389632.0, 99418.0, 25117.0, 8116.0, 3231.0, 1514.0, 829.0, 556.0, 324.0, 200.0, 162.0, 111.0, 74.0, 61.0, 36.0, 35.0, 21.0, 22.0, 12.0, 8.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.044921875, -1.976776123046875, -1.90863037109375, -1.840484619140625, -1.7723388671875, -1.704193115234375, -1.63604736328125, -1.567901611328125, -1.499755859375, -1.431610107421875, -1.36346435546875, -1.295318603515625, -1.2271728515625, -1.159027099609375, -1.09088134765625, -1.022735595703125, -0.95458984375, -0.886444091796875, -0.81829833984375, -0.750152587890625, -0.6820068359375, -0.613861083984375, -0.54571533203125, -0.477569580078125, -0.409423828125, -0.341278076171875, -0.27313232421875, -0.204986572265625, -0.1368408203125, -0.068695068359375, -0.00054931640625, 0.067596435546875, 0.1357421875, 0.203887939453125, 0.27203369140625, 0.340179443359375, 0.4083251953125, 0.476470947265625, 0.54461669921875, 0.612762451171875, 0.680908203125, 0.749053955078125, 0.81719970703125, 0.885345458984375, 0.9534912109375, 1.021636962890625, 1.08978271484375, 1.157928466796875, 1.22607421875, 1.294219970703125, 1.36236572265625, 1.430511474609375, 1.4986572265625, 1.566802978515625, 1.63494873046875, 1.703094482421875, 1.771240234375, 1.839385986328125, 1.90753173828125, 1.975677490234375, 2.0438232421875, 2.111968994140625, 2.18011474609375, 2.248260498046875, 2.31640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 6.0, 5.0, 11.0, 13.0, 11.0, 12.0, 12.0, 16.0, 28.0, 23.0, 24.0, 27.0, 34.0, 27.0, 40.0, 35.0, 60.0, 83.0, 112.0, 338.0, 1463.0, 152.0, 80.0, 58.0, 48.0, 52.0, 34.0, 34.0, 21.0, 18.0, 27.0, 19.0, 17.0, 18.0, 15.0, 11.0, 8.0, 10.0, 11.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.99981689453125, -4.8394775390625, -4.67913818359375, -4.518798828125, -4.35845947265625, -4.1981201171875, -4.03778076171875, -3.87744140625, -3.71710205078125, -3.5567626953125, -3.39642333984375, -3.236083984375, -3.07574462890625, -2.9154052734375, -2.75506591796875, -2.5947265625, -2.43438720703125, -2.2740478515625, -2.11370849609375, -1.953369140625, -1.79302978515625, -1.6326904296875, -1.47235107421875, -1.31201171875, -1.15167236328125, -0.9913330078125, -0.83099365234375, -0.670654296875, -0.51031494140625, -0.3499755859375, -0.18963623046875, -0.029296875, 0.13104248046875, 0.2913818359375, 0.45172119140625, 0.612060546875, 0.77239990234375, 0.9327392578125, 1.09307861328125, 1.25341796875, 1.41375732421875, 1.5740966796875, 1.73443603515625, 1.894775390625, 2.05511474609375, 2.2154541015625, 2.37579345703125, 2.5361328125, 2.69647216796875, 2.8568115234375, 3.01715087890625, 3.177490234375, 3.33782958984375, 3.4981689453125, 3.65850830078125, 3.81884765625, 3.97918701171875, 4.1395263671875, 4.29986572265625, 4.460205078125, 4.62054443359375, 4.7808837890625, 4.94122314453125, 5.1015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 11.0, 8.0, 6.0, 17.0, 19.0, 27.0, 33.0, 41.0, 54.0, 63.0, 87.0, 154.0, 301.0, 705.0, 3112.0, 73598.0, 3022724.0, 40903.0, 2447.0, 592.0, 270.0, 168.0, 82.0, 66.0, 56.0, 34.0, 27.0, 18.0, 24.0, 20.0, 8.0, 6.0, 7.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.72900390625, -10.3876953125, -10.04638671875, -9.705078125, -9.36376953125, -9.0224609375, -8.68115234375, -8.33984375, -7.99853515625, -7.6572265625, -7.31591796875, -6.974609375, -6.63330078125, -6.2919921875, -5.95068359375, -5.609375, -5.26806640625, -4.9267578125, -4.58544921875, -4.244140625, -3.90283203125, -3.5615234375, -3.22021484375, -2.87890625, -2.53759765625, -2.1962890625, -1.85498046875, -1.513671875, -1.17236328125, -0.8310546875, -0.48974609375, -0.1484375, 0.19287109375, 0.5341796875, 0.87548828125, 1.216796875, 1.55810546875, 1.8994140625, 2.24072265625, 2.58203125, 2.92333984375, 3.2646484375, 3.60595703125, 3.947265625, 4.28857421875, 4.6298828125, 4.97119140625, 5.3125, 5.65380859375, 5.9951171875, 6.33642578125, 6.677734375, 7.01904296875, 7.3603515625, 7.70166015625, 8.04296875, 8.38427734375, 8.7255859375, 9.06689453125, 9.408203125, 9.74951171875, 10.0908203125, 10.43212890625, 10.7734375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [16.0, 441.0, 548.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.105020523071289, -2.1163346767425537, -0.12764883041381836, 1.861037254333496, 3.8497228622436523, 5.838408470153809, 7.827095031738281, 9.815780639648438, 11.804466247558594, 13.79315185546875, 15.781837463378906, 17.770523071289062, 19.75920867919922, 21.747894287109375, 23.736581802368164, 25.72526741027832, 27.713953018188477, 29.702638626098633, 31.69132423400879, 33.68001174926758, 35.668697357177734, 37.65738296508789, 39.64606857299805, 41.6347541809082, 43.62343978881836, 45.612125396728516, 47.60081100463867, 49.58949661254883, 51.578182220458984, 53.56686782836914, 55.55555725097656, 57.54424285888672, 59.532928466796875, 61.52161407470703, 63.51029968261719, 65.49898529052734, 67.4876708984375, 69.47635650634766, 71.46504211425781, 73.45372772216797, 75.44241333007812, 77.43109893798828, 79.41978454589844, 81.4084701538086, 83.39715576171875, 85.3858413696289, 87.37452697753906, 89.36321258544922, 91.35189819335938, 93.34058380126953, 95.32926940917969, 97.31795501708984, 99.306640625, 101.29532623291016, 103.28401184082031, 105.27269744873047, 107.26139068603516, 109.25007629394531, 111.23876190185547, 113.22744750976562, 115.21613311767578, 117.20481872558594, 119.1935043334961, 121.18218994140625, 123.1708755493164]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 8.0, 9.0, 8.0, 11.0, 11.0, 17.0, 20.0, 20.0, 21.0, 26.0, 26.0, 28.0, 27.0, 24.0, 21.0, 36.0, 26.0, 42.0, 37.0, 39.0, 38.0, 29.0, 41.0, 48.0, 38.0, 29.0, 35.0, 32.0, 27.0, 30.0, 31.0, 23.0, 11.0, 15.0, 19.0, 13.0, 19.0, 13.0, 13.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.06462860107422, -15.56001091003418, -15.05539321899414, -14.550775527954102, -14.046157836914062, -13.541540145874023, -13.036921501159668, -12.532303810119629, -12.02768611907959, -11.52306842803955, -11.018450736999512, -10.513833045959473, -10.009214401245117, -9.504596710205078, -8.999979019165039, -8.495361328125, -7.990743637084961, -7.486125946044922, -6.981508255004883, -6.4768900871276855, -5.9722723960876465, -5.467654705047607, -4.96303653717041, -4.458418846130371, -3.953801155090332, -3.449183464050293, -2.944565534591675, -2.4399476051330566, -1.9353299140930176, -1.4307122230529785, -0.9260942935943604, -0.4214763641357422, 0.08314132690429688, 0.5877591371536255, 1.092376947402954, 1.5969947576522827, 2.1016125679016113, 2.6062302589416504, 3.1108481884002686, 3.6154661178588867, 4.120083808898926, 4.624701499938965, 5.129319190979004, 5.633937358856201, 6.13855504989624, 6.643172740936279, 7.147790908813477, 7.652408599853516, 8.157026290893555, 8.661643981933594, 9.166261672973633, 9.670879364013672, 10.175497055053711, 10.68011474609375, 11.184733390808105, 11.689351081848145, 12.193968772888184, 12.698586463928223, 13.203204154968262, 13.7078218460083, 14.212440490722656, 14.717058181762695, 15.221675872802734, 15.726293563842773, 16.230911254882812]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 8.0, 10.0, 10.0, 9.0, 12.0, 9.0, 14.0, 12.0, 18.0, 21.0, 18.0, 10.0, 20.0, 33.0, 21.0, 42.0, 32.0, 46.0, 41.0, 56.0, 50.0, 38.0, 44.0, 34.0, 43.0, 38.0, 29.0, 22.0, 35.0, 27.0, 31.0, 24.0, 30.0, 26.0, 14.0, 25.0, 7.0, 7.0, 9.0, 4.0, 1.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5173492431640625, -1.467315673828125, -1.4172821044921875, -1.36724853515625, -1.3172149658203125, -1.267181396484375, -1.2171478271484375, -1.1671142578125, -1.1170806884765625, -1.067047119140625, -1.0170135498046875, -0.96697998046875, -0.9169464111328125, -0.866912841796875, -0.8168792724609375, -0.766845703125, -0.7168121337890625, -0.666778564453125, -0.6167449951171875, -0.56671142578125, -0.5166778564453125, -0.466644287109375, -0.4166107177734375, -0.3665771484375, -0.3165435791015625, -0.266510009765625, -0.2164764404296875, -0.16644287109375, -0.1164093017578125, -0.066375732421875, -0.0163421630859375, 0.03369140625, 0.0837249755859375, 0.133758544921875, 0.1837921142578125, 0.23382568359375, 0.2838592529296875, 0.333892822265625, 0.3839263916015625, 0.4339599609375, 0.4839935302734375, 0.534027099609375, 0.5840606689453125, 0.63409423828125, 0.6841278076171875, 0.734161376953125, 0.7841949462890625, 0.834228515625, 0.8842620849609375, 0.934295654296875, 0.9843292236328125, 1.03436279296875, 1.0843963623046875, 1.134429931640625, 1.1844635009765625, 1.2344970703125, 1.2845306396484375, 1.334564208984375, 1.3845977783203125, 1.43463134765625, 1.4846649169921875, 1.534698486328125, 1.5847320556640625, 1.634765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 6.0, 6.0, 14.0, 8.0, 8.0, 19.0, 22.0, 17.0, 22.0, 44.0, 70.0, 116.0, 179.0, 371.0, 833.0, 2289.0, 7603.0, 33281.0, 211460.0, 1460883.0, 2016106.0, 389176.0, 54733.0, 11623.0, 3252.0, 1105.0, 433.0, 203.0, 115.0, 82.0, 52.0, 41.0, 25.0, 13.0, 19.0, 12.0, 5.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.264923095703125, -3.15289306640625, -3.040863037109375, -2.9288330078125, -2.816802978515625, -2.70477294921875, -2.592742919921875, -2.480712890625, -2.368682861328125, -2.25665283203125, -2.144622802734375, -2.0325927734375, -1.920562744140625, -1.80853271484375, -1.696502685546875, -1.58447265625, -1.472442626953125, -1.36041259765625, -1.248382568359375, -1.1363525390625, -1.024322509765625, -0.91229248046875, -0.800262451171875, -0.688232421875, -0.576202392578125, -0.46417236328125, -0.352142333984375, -0.2401123046875, -0.128082275390625, -0.01605224609375, 0.095977783203125, 0.2080078125, 0.320037841796875, 0.43206787109375, 0.544097900390625, 0.6561279296875, 0.768157958984375, 0.88018798828125, 0.992218017578125, 1.104248046875, 1.216278076171875, 1.32830810546875, 1.440338134765625, 1.5523681640625, 1.664398193359375, 1.77642822265625, 1.888458251953125, 2.00048828125, 2.112518310546875, 2.22454833984375, 2.336578369140625, 2.4486083984375, 2.560638427734375, 2.67266845703125, 2.784698486328125, 2.896728515625, 3.008758544921875, 3.12078857421875, 3.232818603515625, 3.3448486328125, 3.456878662109375, 3.56890869140625, 3.680938720703125, 3.79296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 7.0, 17.0, 11.0, 15.0, 31.0, 39.0, 40.0, 70.0, 73.0, 119.0, 142.0, 190.0, 265.0, 301.0, 405.0, 389.0, 419.0, 306.0, 286.0, 223.0, 154.0, 135.0, 97.0, 87.0, 53.0, 55.0, 28.0, 26.0, 20.0, 10.0, 10.0, 12.0, 5.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7578125, -3.63153076171875, -3.5052490234375, -3.37896728515625, -3.252685546875, -3.12640380859375, -3.0001220703125, -2.87384033203125, -2.74755859375, -2.62127685546875, -2.4949951171875, -2.36871337890625, -2.242431640625, -2.11614990234375, -1.9898681640625, -1.86358642578125, -1.7373046875, -1.61102294921875, -1.4847412109375, -1.35845947265625, -1.232177734375, -1.10589599609375, -0.9796142578125, -0.85333251953125, -0.72705078125, -0.60076904296875, -0.4744873046875, -0.34820556640625, -0.221923828125, -0.09564208984375, 0.0306396484375, 0.15692138671875, 0.283203125, 0.40948486328125, 0.5357666015625, 0.66204833984375, 0.788330078125, 0.91461181640625, 1.0408935546875, 1.16717529296875, 1.29345703125, 1.41973876953125, 1.5460205078125, 1.67230224609375, 1.798583984375, 1.92486572265625, 2.0511474609375, 2.17742919921875, 2.3037109375, 2.42999267578125, 2.5562744140625, 2.68255615234375, 2.808837890625, 2.93511962890625, 3.0614013671875, 3.18768310546875, 3.31396484375, 3.44024658203125, 3.5665283203125, 3.69281005859375, 3.819091796875, 3.94537353515625, 4.0716552734375, 4.19793701171875, 4.32421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 10.0, 12.0, 23.0, 35.0, 55.0, 97.0, 172.0, 478.0, 2740.0, 153447.0, 3952261.0, 82074.0, 2082.0, 415.0, 165.0, 99.0, 50.0, 20.0, 22.0, 8.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.53125, -23.9532470703125, -23.375244140625, -22.7972412109375, -22.21923828125, -21.6412353515625, -21.063232421875, -20.4852294921875, -19.9072265625, -19.3292236328125, -18.751220703125, -18.1732177734375, -17.59521484375, -17.0172119140625, -16.439208984375, -15.8612060546875, -15.283203125, -14.7052001953125, -14.127197265625, -13.5491943359375, -12.97119140625, -12.3931884765625, -11.815185546875, -11.2371826171875, -10.6591796875, -10.0811767578125, -9.503173828125, -8.9251708984375, -8.34716796875, -7.7691650390625, -7.191162109375, -6.6131591796875, -6.03515625, -5.4571533203125, -4.879150390625, -4.3011474609375, -3.72314453125, -3.1451416015625, -2.567138671875, -1.9891357421875, -1.4111328125, -0.8331298828125, -0.255126953125, 0.3228759765625, 0.90087890625, 1.4788818359375, 2.056884765625, 2.6348876953125, 3.212890625, 3.7908935546875, 4.368896484375, 4.9468994140625, 5.52490234375, 6.1029052734375, 6.680908203125, 7.2589111328125, 7.8369140625, 8.4149169921875, 8.992919921875, 9.5709228515625, 10.14892578125, 10.7269287109375, 11.304931640625, 11.8829345703125, 12.4609375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 14.0, 42.0, 75.0, 109.0, 184.0, 195.0, 167.0, 115.0, 57.0, 30.0, 12.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.153446197509766, -42.1279411315918, -41.102439880371094, -40.076934814453125, -39.051429748535156, -38.02592468261719, -37.00041961669922, -35.974918365478516, -34.94941329956055, -33.92390823364258, -32.898406982421875, -31.872901916503906, -30.847396850585938, -29.82189178466797, -28.796388626098633, -27.770885467529297, -26.745380401611328, -25.71987533569336, -24.694372177124023, -23.668869018554688, -22.64336395263672, -21.61785888671875, -20.592355728149414, -19.566852569580078, -18.54134750366211, -17.51584243774414, -16.490339279174805, -15.464835166931152, -14.4393310546875, -13.413826942443848, -12.388322830200195, -11.362818717956543, -10.33731460571289, -9.311810493469238, -8.286306381225586, -7.260802268981934, -6.235298156738281, -5.209794044494629, -4.184289932250977, -3.158785820007324, -2.133281707763672, -1.1077775955200195, -0.08227348327636719, 0.9432306289672852, 1.9687347412109375, 2.99423885345459, 4.019742965698242, 5.0452470779418945, 6.070751190185547, 7.096255302429199, 8.121759414672852, 9.147263526916504, 10.172767639160156, 11.198271751403809, 12.223775863647461, 13.249279975891113, 14.274784088134766, 15.300288200378418, 16.32579231262207, 17.351295471191406, 18.376800537109375, 19.402305603027344, 20.42780876159668, 21.453311920166016, 22.478816986083984]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 7.0, 10.0, 9.0, 15.0, 11.0, 18.0, 25.0, 18.0, 24.0, 23.0, 36.0, 29.0, 26.0, 24.0, 31.0, 44.0, 28.0, 33.0, 30.0, 36.0, 42.0, 41.0, 39.0, 45.0, 31.0, 42.0, 33.0, 29.0, 29.0, 21.0, 28.0, 27.0, 16.0, 18.0, 18.0, 17.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.86210823059082, -12.397945404052734, -11.933783531188965, -11.469621658325195, -11.00545883178711, -10.541296005249023, -10.077134132385254, -9.612972259521484, -9.148809432983398, -8.684646606445312, -8.220484733581543, -7.756322383880615, -7.2921600341796875, -6.82799768447876, -6.363835334777832, -5.899672985076904, -5.435510635375977, -4.971348285675049, -4.507185935974121, -4.043023586273193, -3.5788612365722656, -3.114698886871338, -2.65053653717041, -2.1863741874694824, -1.7222118377685547, -1.258049488067627, -0.7938871383666992, -0.3297247886657715, 0.13443756103515625, 0.598599910736084, 1.0627622604370117, 1.5269246101379395, 1.9910869598388672, 2.455249309539795, 2.9194116592407227, 3.3835740089416504, 3.847736358642578, 4.311898708343506, 4.776061058044434, 5.240223407745361, 5.704385757446289, 6.168548107147217, 6.6327104568481445, 7.096872806549072, 7.56103515625, 8.025197982788086, 8.489359855651855, 8.953521728515625, 9.417684555053711, 9.881847381591797, 10.346009254455566, 10.810171127319336, 11.274333953857422, 11.738496780395508, 12.202658653259277, 12.666820526123047, 13.130983352661133, 13.595146179199219, 14.059308052062988, 14.523469924926758, 14.987632751464844, 15.45179557800293, 15.9159574508667, 16.38011932373047, 16.844282150268555]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 5.0, 11.0, 7.0, 10.0, 10.0, 16.0, 12.0, 15.0, 15.0, 18.0, 11.0, 22.0, 33.0, 27.0, 34.0, 41.0, 36.0, 32.0, 40.0, 52.0, 35.0, 39.0, 30.0, 36.0, 42.0, 40.0, 40.0, 28.0, 34.0, 22.0, 23.0, 26.0, 21.0, 25.0, 19.0, 15.0, 9.0, 12.0, 8.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.669921875, -1.621978759765625, -1.57403564453125, -1.526092529296875, -1.4781494140625, -1.430206298828125, -1.38226318359375, -1.334320068359375, -1.286376953125, -1.238433837890625, -1.19049072265625, -1.142547607421875, -1.0946044921875, -1.046661376953125, -0.99871826171875, -0.950775146484375, -0.90283203125, -0.854888916015625, -0.80694580078125, -0.759002685546875, -0.7110595703125, -0.663116455078125, -0.61517333984375, -0.567230224609375, -0.519287109375, -0.471343994140625, -0.42340087890625, -0.375457763671875, -0.3275146484375, -0.279571533203125, -0.23162841796875, -0.183685302734375, -0.1357421875, -0.087799072265625, -0.03985595703125, 0.008087158203125, 0.0560302734375, 0.103973388671875, 0.15191650390625, 0.199859619140625, 0.247802734375, 0.295745849609375, 0.34368896484375, 0.391632080078125, 0.4395751953125, 0.487518310546875, 0.53546142578125, 0.583404541015625, 0.63134765625, 0.679290771484375, 0.72723388671875, 0.775177001953125, 0.8231201171875, 0.871063232421875, 0.91900634765625, 0.966949462890625, 1.014892578125, 1.062835693359375, 1.11077880859375, 1.158721923828125, 1.2066650390625, 1.254608154296875, 1.30255126953125, 1.350494384765625, 1.3984375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 15.0, 9.0, 16.0, 29.0, 46.0, 53.0, 113.0, 162.0, 219.0, 289.0, 438.0, 569.0, 797.0, 1077.0, 1569.0, 2122.0, 2902.0, 4109.0, 5914.0, 8265.0, 11448.0, 16411.0, 23927.0, 35521.0, 55488.0, 90266.0, 160143.0, 239834.0, 144633.0, 82602.0, 50952.0, 32832.0, 22306.0, 15197.0, 10939.0, 7751.0, 5525.0, 4006.0, 2856.0, 2023.0, 1432.0, 1141.0, 810.0, 513.0, 450.0, 235.0, 197.0, 146.0, 86.0, 57.0, 64.0, 26.0, 17.0, 10.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24109649658203125, -0.2331695556640625, -0.22524261474609375, -0.217315673828125, -0.20938873291015625, -0.2014617919921875, -0.19353485107421875, -0.18560791015625, -0.17768096923828125, -0.1697540283203125, -0.16182708740234375, -0.153900146484375, -0.14597320556640625, -0.1380462646484375, -0.13011932373046875, -0.1221923828125, -0.11426544189453125, -0.1063385009765625, -0.09841156005859375, -0.090484619140625, -0.08255767822265625, -0.0746307373046875, -0.06670379638671875, -0.05877685546875, -0.05084991455078125, -0.0429229736328125, -0.03499603271484375, -0.027069091796875, -0.01914215087890625, -0.0112152099609375, -0.00328826904296875, 0.004638671875, 0.01256561279296875, 0.0204925537109375, 0.02841949462890625, 0.036346435546875, 0.04427337646484375, 0.0522003173828125, 0.06012725830078125, 0.06805419921875, 0.07598114013671875, 0.0839080810546875, 0.09183502197265625, 0.099761962890625, 0.10768890380859375, 0.1156158447265625, 0.12354278564453125, 0.1314697265625, 0.13939666748046875, 0.1473236083984375, 0.15525054931640625, 0.163177490234375, 0.17110443115234375, 0.1790313720703125, 0.18695831298828125, 0.19488525390625, 0.20281219482421875, 0.2107391357421875, 0.21866607666015625, 0.226593017578125, 0.23451995849609375, 0.2424468994140625, 0.25037384033203125, 0.25830078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 7.0, 10.0, 7.0, 6.0, 11.0, 15.0, 19.0, 20.0, 25.0, 23.0, 33.0, 28.0, 19.0, 31.0, 40.0, 46.0, 31.0, 42.0, 49.0, 1058.0, 35.0, 44.0, 31.0, 52.0, 32.0, 32.0, 32.0, 28.0, 22.0, 21.0, 18.0, 18.0, 20.0, 24.0, 18.0, 14.0, 10.0, 8.0, 10.0, 6.0, 7.0, 1.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.025390625, -0.9940109252929688, -0.9626312255859375, -0.9312515258789062, -0.899871826171875, -0.8684921264648438, -0.8371124267578125, -0.8057327270507812, -0.77435302734375, -0.7429733276367188, -0.7115936279296875, -0.6802139282226562, -0.648834228515625, -0.6174545288085938, -0.5860748291015625, -0.5546951293945312, -0.5233154296875, -0.49193572998046875, -0.4605560302734375, -0.42917633056640625, -0.397796630859375, -0.36641693115234375, -0.3350372314453125, -0.30365753173828125, -0.27227783203125, -0.24089813232421875, -0.2095184326171875, -0.17813873291015625, -0.146759033203125, -0.11537933349609375, -0.0839996337890625, -0.05261993408203125, -0.021240234375, 0.01013946533203125, 0.0415191650390625, 0.07289886474609375, 0.104278564453125, 0.13565826416015625, 0.1670379638671875, 0.19841766357421875, 0.22979736328125, 0.26117706298828125, 0.2925567626953125, 0.32393646240234375, 0.355316162109375, 0.38669586181640625, 0.4180755615234375, 0.44945526123046875, 0.4808349609375, 0.5122146606445312, 0.5435943603515625, 0.5749740600585938, 0.606353759765625, 0.6377334594726562, 0.6691131591796875, 0.7004928588867188, 0.73187255859375, 0.7632522583007812, 0.7946319580078125, 0.8260116577148438, 0.857391357421875, 0.8887710571289062, 0.9201507568359375, 0.9515304565429688, 0.98291015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 9.0, 8.0, 10.0, 15.0, 19.0, 47.0, 53.0, 81.0, 130.0, 216.0, 274.0, 368.0, 621.0, 902.0, 1223.0, 1823.0, 2626.0, 4053.0, 5755.0, 8518.0, 12679.0, 18980.0, 29341.0, 47612.0, 82815.0, 161117.0, 1337754.0, 162145.0, 83089.0, 47815.0, 29637.0, 18921.0, 12262.0, 8278.0, 5640.0, 3751.0, 2665.0, 1791.0, 1293.0, 845.0, 637.0, 427.0, 269.0, 199.0, 145.0, 91.0, 74.0, 37.0, 33.0, 18.0, 9.0, 12.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.27685546875, -0.2683372497558594, -0.25981903076171875, -0.2513008117675781, -0.2427825927734375, -0.23426437377929688, -0.22574615478515625, -0.21722793579101562, -0.208709716796875, -0.20019149780273438, -0.19167327880859375, -0.18315505981445312, -0.1746368408203125, -0.16611862182617188, -0.15760040283203125, -0.14908218383789062, -0.14056396484375, -0.13204574584960938, -0.12352752685546875, -0.11500930786132812, -0.1064910888671875, -0.09797286987304688, -0.08945465087890625, -0.08093643188476562, -0.072418212890625, -0.06389999389648438, -0.05538177490234375, -0.046863555908203125, -0.0383453369140625, -0.029827117919921875, -0.02130889892578125, -0.012790679931640625, -0.0042724609375, 0.004245758056640625, 0.01276397705078125, 0.021282196044921875, 0.0298004150390625, 0.038318634033203125, 0.04683685302734375, 0.055355072021484375, 0.063873291015625, 0.07239151000976562, 0.08090972900390625, 0.08942794799804688, 0.0979461669921875, 0.10646438598632812, 0.11498260498046875, 0.12350082397460938, 0.13201904296875, 0.14053726196289062, 0.14905548095703125, 0.15757369995117188, 0.1660919189453125, 0.17461013793945312, 0.18312835693359375, 0.19164657592773438, 0.200164794921875, 0.20868301391601562, 0.21720123291015625, 0.22571945190429688, 0.2342376708984375, 0.24275588989257812, 0.25127410888671875, 0.2597923278808594, 0.268310546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 14.0, 14.0, 14.0, 15.0, 18.0, 22.0, 28.0, 37.0, 37.0, 33.0, 62.0, 50.0, 51.0, 49.0, 67.0, 47.0, 54.0, 50.0, 48.0, 42.0, 36.0, 40.0, 24.0, 30.0, 20.0, 17.0, 15.0, 7.0, 6.0, 3.0, 8.0, 2.0, 9.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013875961303710938, -0.0001340322196483612, -0.00012930482625961304, -0.00012457743287086487, -0.0001198500394821167, -0.00011512264609336853, -0.00011039525270462036, -0.00010566785931587219, -0.00010094046592712402, -9.621307253837585e-05, -9.148567914962769e-05, -8.675828576087952e-05, -8.203089237213135e-05, -7.730349898338318e-05, -7.257610559463501e-05, -6.784871220588684e-05, -6.312131881713867e-05, -5.83939254283905e-05, -5.3666532039642334e-05, -4.8939138650894165e-05, -4.4211745262145996e-05, -3.948435187339783e-05, -3.475695848464966e-05, -3.002956509590149e-05, -2.530217170715332e-05, -2.057477831840515e-05, -1.5847384929656982e-05, -1.1119991540908813e-05, -6.3925981521606445e-06, -1.6652047634124756e-06, 3.0621886253356934e-06, 7.789582014083862e-06, 1.2516975402832031e-05, 1.72443687915802e-05, 2.197176218032837e-05, 2.6699155569076538e-05, 3.142654895782471e-05, 3.6153942346572876e-05, 4.0881335735321045e-05, 4.5608729124069214e-05, 5.033612251281738e-05, 5.506351590156555e-05, 5.979090929031372e-05, 6.451830267906189e-05, 6.924569606781006e-05, 7.397308945655823e-05, 7.87004828453064e-05, 8.342787623405457e-05, 8.815526962280273e-05, 9.28826630115509e-05, 9.761005640029907e-05, 0.00010233744978904724, 0.00010706484317779541, 0.00011179223656654358, 0.00011651962995529175, 0.00012124702334403992, 0.00012597441673278809, 0.00013070181012153625, 0.00013542920351028442, 0.0001401565968990326, 0.00014488399028778076, 0.00014961138367652893, 0.0001543387770652771, 0.00015906617045402527, 0.00016379356384277344]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 12.0, 6.0, 13.0, 5.0, 9.0, 16.0, 12.0, 36.0, 44.0, 64.0, 67.0, 101.0, 162.0, 187.0, 282.0, 483.0, 999.0, 80256.0, 957159.0, 6674.0, 659.0, 392.0, 249.0, 173.0, 119.0, 82.0, 63.0, 59.0, 33.0, 26.0, 26.0, 16.0, 13.0, 14.0, 11.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0032215118408203125, -0.0031276047229766846, -0.0030336976051330566, -0.0029397904872894287, -0.0028458833694458008, -0.002751976251602173, -0.002658069133758545, -0.002564162015914917, -0.002470254898071289, -0.002376347780227661, -0.002282440662384033, -0.0021885335445404053, -0.0020946264266967773, -0.0020007193088531494, -0.0019068121910095215, -0.0018129050731658936, -0.0017189979553222656, -0.0016250908374786377, -0.0015311837196350098, -0.0014372766017913818, -0.001343369483947754, -0.001249462366104126, -0.001155555248260498, -0.0010616481304168701, -0.0009677410125732422, -0.0008738338947296143, -0.0007799267768859863, -0.0006860196590423584, -0.0005921125411987305, -0.0004982054233551025, -0.0004042983055114746, -0.0003103911876678467, -0.00021648406982421875, -0.00012257695198059082, -2.866983413696289e-05, 6.523728370666504e-05, 0.00015914440155029297, 0.0002530515193939209, 0.00034695863723754883, 0.00044086575508117676, 0.0005347728729248047, 0.0006286799907684326, 0.0007225871086120605, 0.0008164942264556885, 0.0009104013442993164, 0.0010043084621429443, 0.0010982155799865723, 0.0011921226978302002, 0.0012860298156738281, 0.001379936933517456, 0.001473844051361084, 0.001567751169204712, 0.0016616582870483398, 0.0017555654048919678, 0.0018494725227355957, 0.0019433796405792236, 0.0020372867584228516, 0.0021311938762664795, 0.0022251009941101074, 0.0023190081119537354, 0.0024129152297973633, 0.002506822347640991, 0.002600729465484619, 0.002694636583328247, 0.002788543701171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 65.0, 299.0, 409.0, 196.0, 30.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004159118980169296, -0.0004017203173134476, -0.00038752873660996556, -0.00037333715590648353, -0.0003591455752030015, -0.00034495399449951947, -0.00033076241379603744, -0.00031657086219638586, -0.00030237925238907337, -0.00028818767168559134, -0.0002739960909821093, -0.0002598045102786273, -0.00024561292957514524, -0.0002314213488716632, -0.0002172297827200964, -0.00020303820201661438, -0.00018884663586504757, -0.00017465505516156554, -0.0001604634744580835, -0.00014627189375460148, -0.00013208031305111945, -0.00011788873962359503, -0.00010369716619607061, -8.950558549258858e-05, -7.531400478910655e-05, -6.112242408562452e-05, -4.693084702012129e-05, -3.2739269954618067e-05, -1.8547689251136035e-05, -4.356108547654003e-06, 9.835464879870415e-06, 2.4027045583352447e-05, 3.821862628683448e-05, 5.241020699031651e-05, 6.660178769379854e-05, 8.079336112132296e-05, 9.498494182480499e-05, 0.00010917652252828702, 0.00012336809595581144, 0.00013755967665929347, 0.0001517512573627755, 0.00016594283806625754, 0.00018013441876973957, 0.00019432598492130637, 0.0002085175656247884, 0.00022270914632827044, 0.00023690072703175247, 0.0002510923077352345, 0.00026528388843871653, 0.00027947546914219856, 0.0002936670498456806, 0.0003078586305491626, 0.00032205021125264466, 0.0003362417919561267, 0.00035043334355577826, 0.00036462495336309075, 0.00037881650496274233, 0.00039300808566622436, 0.0004071996663697064, 0.0004213912470731884, 0.00043558282777667046, 0.0004497744084801525, 0.0004639659891836345, 0.0004781575407832861, 0.0004923491505905986]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 5.0, 12.0, 15.0, 21.0, 20.0, 22.0, 34.0, 40.0, 36.0, 38.0, 41.0, 40.0, 37.0, 43.0, 43.0, 47.0, 35.0, 39.0, 50.0, 48.0, 35.0, 39.0, 35.0, 34.0, 26.0, 21.0, 24.0, 18.0, 20.0, 15.0, 11.0, 14.0, 10.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.690357208251953e-05, -8.42418521642685e-05, -8.158013224601746e-05, -7.891841232776642e-05, -7.625669240951538e-05, -7.359497249126434e-05, -7.09332525730133e-05, -6.827153265476227e-05, -6.560981273651123e-05, -6.294809281826019e-05, -6.0286372900009155e-05, -5.762465298175812e-05, -5.496293306350708e-05, -5.230121314525604e-05, -4.9639493227005005e-05, -4.697777330875397e-05, -4.431605339050293e-05, -4.165433347225189e-05, -3.8992613554000854e-05, -3.633089363574982e-05, -3.366917371749878e-05, -3.100745379924774e-05, -2.8345733880996704e-05, -2.5684013962745667e-05, -2.302229404449463e-05, -2.036057412624359e-05, -1.7698854207992554e-05, -1.5037134289741516e-05, -1.2375414371490479e-05, -9.713694453239441e-06, -7.051974534988403e-06, -4.390254616737366e-06, -1.7285346984863281e-06, 9.331852197647095e-07, 3.594905138015747e-06, 6.256625056266785e-06, 8.918344974517822e-06, 1.158006489276886e-05, 1.4241784811019897e-05, 1.6903504729270935e-05, 1.9565224647521973e-05, 2.222694456577301e-05, 2.4888664484024048e-05, 2.7550384402275085e-05, 3.0212104320526123e-05, 3.287382423877716e-05, 3.55355441570282e-05, 3.8197264075279236e-05, 4.0858983993530273e-05, 4.352070391178131e-05, 4.618242383003235e-05, 4.8844143748283386e-05, 5.1505863666534424e-05, 5.416758358478546e-05, 5.68293035030365e-05, 5.949102342128754e-05, 6.215274333953857e-05, 6.481446325778961e-05, 6.747618317604065e-05, 7.013790309429169e-05, 7.279962301254272e-05, 7.546134293079376e-05, 7.81230628490448e-05, 8.078478276729584e-05, 8.344650268554688e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 5.0, 11.0, 7.0, 10.0, 10.0, 16.0, 12.0, 15.0, 15.0, 18.0, 11.0, 22.0, 33.0, 27.0, 34.0, 41.0, 36.0, 32.0, 40.0, 52.0, 35.0, 39.0, 30.0, 36.0, 42.0, 40.0, 40.0, 28.0, 34.0, 22.0, 23.0, 26.0, 21.0, 25.0, 19.0, 15.0, 9.0, 12.0, 8.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.669921875, -1.621978759765625, -1.57403564453125, -1.526092529296875, -1.4781494140625, -1.430206298828125, -1.38226318359375, -1.334320068359375, -1.286376953125, -1.238433837890625, -1.19049072265625, -1.142547607421875, -1.0946044921875, -1.046661376953125, -0.99871826171875, -0.950775146484375, -0.90283203125, -0.854888916015625, -0.80694580078125, -0.759002685546875, -0.7110595703125, -0.663116455078125, -0.61517333984375, -0.567230224609375, -0.519287109375, -0.471343994140625, -0.42340087890625, -0.375457763671875, -0.3275146484375, -0.279571533203125, -0.23162841796875, -0.183685302734375, -0.1357421875, -0.087799072265625, -0.03985595703125, 0.008087158203125, 0.0560302734375, 0.103973388671875, 0.15191650390625, 0.199859619140625, 0.247802734375, 0.295745849609375, 0.34368896484375, 0.391632080078125, 0.4395751953125, 0.487518310546875, 0.53546142578125, 0.583404541015625, 0.63134765625, 0.679290771484375, 0.72723388671875, 0.775177001953125, 0.8231201171875, 0.871063232421875, 0.91900634765625, 0.966949462890625, 1.014892578125, 1.062835693359375, 1.11077880859375, 1.158721923828125, 1.2066650390625, 1.254608154296875, 1.30255126953125, 1.350494384765625, 1.3984375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 7.0, 12.0, 16.0, 24.0, 20.0, 42.0, 54.0, 84.0, 110.0, 183.0, 287.0, 433.0, 708.0, 1186.0, 1847.0, 3170.0, 5639.0, 10444.0, 21015.0, 43724.0, 91790.0, 175495.0, 250345.0, 209469.0, 118205.0, 57007.0, 26961.0, 13308.0, 7014.0, 3871.0, 2297.0, 1350.0, 877.0, 528.0, 336.0, 231.0, 156.0, 96.0, 60.0, 46.0, 25.0, 22.0, 16.0, 7.0, 8.0, 7.0, 10.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2685546875, -1.229736328125, -1.19091796875, -1.152099609375, -1.11328125, -1.074462890625, -1.03564453125, -0.996826171875, -0.9580078125, -0.919189453125, -0.88037109375, -0.841552734375, -0.802734375, -0.763916015625, -0.72509765625, -0.686279296875, -0.6474609375, -0.608642578125, -0.56982421875, -0.531005859375, -0.4921875, -0.453369140625, -0.41455078125, -0.375732421875, -0.3369140625, -0.298095703125, -0.25927734375, -0.220458984375, -0.181640625, -0.142822265625, -0.10400390625, -0.065185546875, -0.0263671875, 0.012451171875, 0.05126953125, 0.090087890625, 0.12890625, 0.167724609375, 0.20654296875, 0.245361328125, 0.2841796875, 0.322998046875, 0.36181640625, 0.400634765625, 0.439453125, 0.478271484375, 0.51708984375, 0.555908203125, 0.5947265625, 0.633544921875, 0.67236328125, 0.711181640625, 0.75, 0.788818359375, 0.82763671875, 0.866455078125, 0.9052734375, 0.944091796875, 0.98291015625, 1.021728515625, 1.060546875, 1.099365234375, 1.13818359375, 1.177001953125, 1.2158203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 10.0, 9.0, 10.0, 14.0, 14.0, 14.0, 14.0, 18.0, 22.0, 18.0, 30.0, 34.0, 36.0, 42.0, 36.0, 39.0, 80.0, 170.0, 336.0, 1387.0, 185.0, 90.0, 57.0, 50.0, 36.0, 36.0, 35.0, 21.0, 31.0, 18.0, 26.0, 24.0, 13.0, 13.0, 13.0, 15.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.84765625, -5.6761474609375, -5.504638671875, -5.3331298828125, -5.16162109375, -4.9901123046875, -4.818603515625, -4.6470947265625, -4.4755859375, -4.3040771484375, -4.132568359375, -3.9610595703125, -3.78955078125, -3.6180419921875, -3.446533203125, -3.2750244140625, -3.103515625, -2.9320068359375, -2.760498046875, -2.5889892578125, -2.41748046875, -2.2459716796875, -2.074462890625, -1.9029541015625, -1.7314453125, -1.5599365234375, -1.388427734375, -1.2169189453125, -1.04541015625, -0.8739013671875, -0.702392578125, -0.5308837890625, -0.359375, -0.1878662109375, -0.016357421875, 0.1551513671875, 0.32666015625, 0.4981689453125, 0.669677734375, 0.8411865234375, 1.0126953125, 1.1842041015625, 1.355712890625, 1.5272216796875, 1.69873046875, 1.8702392578125, 2.041748046875, 2.2132568359375, 2.384765625, 2.5562744140625, 2.727783203125, 2.8992919921875, 3.07080078125, 3.2423095703125, 3.413818359375, 3.5853271484375, 3.7568359375, 3.9283447265625, 4.099853515625, 4.2713623046875, 4.44287109375, 4.6143798828125, 4.785888671875, 4.9573974609375, 5.12890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 14.0, 15.0, 11.0, 17.0, 19.0, 24.0, 30.0, 47.0, 62.0, 72.0, 94.0, 123.0, 225.0, 454.0, 1225.0, 8544.0, 469153.0, 2633216.0, 28648.0, 2122.0, 631.0, 267.0, 187.0, 118.0, 87.0, 62.0, 38.0, 32.0, 33.0, 24.0, 23.0, 17.0, 14.0, 12.0, 5.0, 6.0, 4.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1778564453125, -8.863525390625, -8.5491943359375, -8.23486328125, -7.9205322265625, -7.606201171875, -7.2918701171875, -6.9775390625, -6.6632080078125, -6.348876953125, -6.0345458984375, -5.72021484375, -5.4058837890625, -5.091552734375, -4.7772216796875, -4.462890625, -4.1485595703125, -3.834228515625, -3.5198974609375, -3.20556640625, -2.8912353515625, -2.576904296875, -2.2625732421875, -1.9482421875, -1.6339111328125, -1.319580078125, -1.0052490234375, -0.69091796875, -0.3765869140625, -0.062255859375, 0.2520751953125, 0.56640625, 0.8807373046875, 1.195068359375, 1.5093994140625, 1.82373046875, 2.1380615234375, 2.452392578125, 2.7667236328125, 3.0810546875, 3.3953857421875, 3.709716796875, 4.0240478515625, 4.33837890625, 4.6527099609375, 4.967041015625, 5.2813720703125, 5.595703125, 5.9100341796875, 6.224365234375, 6.5386962890625, 6.85302734375, 7.1673583984375, 7.481689453125, 7.7960205078125, 8.1103515625, 8.4246826171875, 8.739013671875, 9.0533447265625, 9.36767578125, 9.6820068359375, 9.996337890625, 10.3106689453125, 10.625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 125.0, 449.0, 360.0, 64.0, 9.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.02841186523438, -70.76129913330078, -69.49418640136719, -68.2270736694336, -66.95996856689453, -65.69285583496094, -64.42574310302734, -63.15863037109375, -61.891517639160156, -60.62440490722656, -59.357295989990234, -58.09018325805664, -56.82307052612305, -55.55595779418945, -54.288848876953125, -53.02173614501953, -51.75462341308594, -50.487510681152344, -49.220401763916016, -47.95328903198242, -46.68617630004883, -45.419063568115234, -44.151954650878906, -42.88484191894531, -41.617733001708984, -40.35062026977539, -39.08351135253906, -37.81639862060547, -36.549285888671875, -35.28217315673828, -34.01506423950195, -32.74795150756836, -31.4808349609375, -30.21372413635254, -28.946611404418945, -27.679500579833984, -26.41238784790039, -25.14527702331543, -23.87816619873047, -22.611053466796875, -21.343942642211914, -20.076831817626953, -18.80971908569336, -17.5426082611084, -16.275495529174805, -15.008384704589844, -13.741272926330566, -12.474161148071289, -11.207049369812012, -9.939937591552734, -8.672825813293457, -7.405714511871338, -6.1386027336120605, -4.871490955352783, -3.604379653930664, -2.3372678756713867, -1.0701560974121094, 0.19695556163787842, 1.4640672206878662, 2.7311787605285645, 3.998290538787842, 5.265402317047119, 6.532513618469238, 7.799625396728516, 9.066737174987793]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 4.0, 10.0, 6.0, 8.0, 8.0, 10.0, 12.0, 20.0, 26.0, 19.0, 32.0, 28.0, 35.0, 27.0, 38.0, 35.0, 33.0, 58.0, 57.0, 48.0, 55.0, 53.0, 52.0, 45.0, 36.0, 49.0, 28.0, 30.0, 19.0, 25.0, 20.0, 16.0, 5.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34966278076172, -22.683855056762695, -22.018049240112305, -21.35224151611328, -20.68643569946289, -20.020627975463867, -19.354822158813477, -18.689014434814453, -18.023208618164062, -17.35740089416504, -16.69159507751465, -16.025787353515625, -15.359981536865234, -14.694174766540527, -14.02836799621582, -13.362560272216797, -12.69675350189209, -12.030946731567383, -11.365139961242676, -10.699333190917969, -10.033526420593262, -9.367719650268555, -8.701911926269531, -8.03610610961914, -7.370298862457275, -6.704492092132568, -6.038685321807861, -5.372878074645996, -4.707071304321289, -4.041264533996582, -3.375457763671875, -2.709650993347168, -2.043844223022461, -1.378037452697754, -0.7122305631637573, -0.04642367362976074, 0.6193830966949463, 1.2851898670196533, 1.9509968757629395, 2.6168036460876465, 3.2826104164123535, 3.9484171867370605, 4.614223957061768, 5.280031204223633, 5.94583797454834, 6.611644744873047, 7.277451515197754, 7.943258285522461, 8.609065055847168, 9.274871826171875, 9.940678596496582, 10.606485366821289, 11.272292137145996, 11.938098907470703, 12.603906631469727, 13.269712448120117, 13.93552017211914, 14.601326942443848, 15.267133712768555, 15.932940483093262, 16.59874725341797, 17.264554977416992, 17.930360794067383, 18.596168518066406, 19.261974334716797]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 6.0, 10.0, 5.0, 9.0, 6.0, 10.0, 17.0, 16.0, 17.0, 11.0, 19.0, 23.0, 23.0, 23.0, 32.0, 33.0, 33.0, 38.0, 38.0, 51.0, 44.0, 44.0, 42.0, 37.0, 31.0, 43.0, 32.0, 23.0, 44.0, 30.0, 26.0, 30.0, 27.0, 17.0, 19.0, 19.0, 14.0, 13.0, 10.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8212890625, -1.768798828125, -1.71630859375, -1.663818359375, -1.611328125, -1.558837890625, -1.50634765625, -1.453857421875, -1.4013671875, -1.348876953125, -1.29638671875, -1.243896484375, -1.19140625, -1.138916015625, -1.08642578125, -1.033935546875, -0.9814453125, -0.928955078125, -0.87646484375, -0.823974609375, -0.771484375, -0.718994140625, -0.66650390625, -0.614013671875, -0.5615234375, -0.509033203125, -0.45654296875, -0.404052734375, -0.3515625, -0.299072265625, -0.24658203125, -0.194091796875, -0.1416015625, -0.089111328125, -0.03662109375, 0.015869140625, 0.068359375, 0.120849609375, 0.17333984375, 0.225830078125, 0.2783203125, 0.330810546875, 0.38330078125, 0.435791015625, 0.48828125, 0.540771484375, 0.59326171875, 0.645751953125, 0.6982421875, 0.750732421875, 0.80322265625, 0.855712890625, 0.908203125, 0.960693359375, 1.01318359375, 1.065673828125, 1.1181640625, 1.170654296875, 1.22314453125, 1.275634765625, 1.328125, 1.380615234375, 1.43310546875, 1.485595703125, 1.5380859375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 8.0, 5.0, 4.0, 9.0, 4.0, 6.0, 9.0, 14.0, 13.0, 14.0, 16.0, 30.0, 29.0, 32.0, 54.0, 89.0, 113.0, 172.0, 373.0, 990.0, 3548.0, 18383.0, 149730.0, 1502618.0, 2180789.0, 298345.0, 30909.0, 5402.0, 1369.0, 509.0, 225.0, 136.0, 80.0, 51.0, 47.0, 36.0, 34.0, 18.0, 18.0, 13.0, 7.0, 10.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.609375, -4.47027587890625, -4.3311767578125, -4.19207763671875, -4.052978515625, -3.91387939453125, -3.7747802734375, -3.63568115234375, -3.49658203125, -3.35748291015625, -3.2183837890625, -3.07928466796875, -2.940185546875, -2.80108642578125, -2.6619873046875, -2.52288818359375, -2.3837890625, -2.24468994140625, -2.1055908203125, -1.96649169921875, -1.827392578125, -1.68829345703125, -1.5491943359375, -1.41009521484375, -1.27099609375, -1.13189697265625, -0.9927978515625, -0.85369873046875, -0.714599609375, -0.57550048828125, -0.4364013671875, -0.29730224609375, -0.158203125, -0.01910400390625, 0.1199951171875, 0.25909423828125, 0.398193359375, 0.53729248046875, 0.6763916015625, 0.81549072265625, 0.95458984375, 1.09368896484375, 1.2327880859375, 1.37188720703125, 1.510986328125, 1.65008544921875, 1.7891845703125, 1.92828369140625, 2.0673828125, 2.20648193359375, 2.3455810546875, 2.48468017578125, 2.623779296875, 2.76287841796875, 2.9019775390625, 3.04107666015625, 3.18017578125, 3.31927490234375, 3.4583740234375, 3.59747314453125, 3.736572265625, 3.87567138671875, 4.0147705078125, 4.15386962890625, 4.29296875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 6.0, 6.0, 14.0, 14.0, 25.0, 41.0, 50.0, 56.0, 80.0, 119.0, 185.0, 248.0, 312.0, 425.0, 491.0, 475.0, 375.0, 308.0, 236.0, 184.0, 126.0, 91.0, 57.0, 46.0, 22.0, 28.0, 14.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.9266357421875, -4.767333984375, -4.6080322265625, -4.44873046875, -4.2894287109375, -4.130126953125, -3.9708251953125, -3.8115234375, -3.6522216796875, -3.492919921875, -3.3336181640625, -3.17431640625, -3.0150146484375, -2.855712890625, -2.6964111328125, -2.537109375, -2.3778076171875, -2.218505859375, -2.0592041015625, -1.89990234375, -1.7406005859375, -1.581298828125, -1.4219970703125, -1.2626953125, -1.1033935546875, -0.944091796875, -0.7847900390625, -0.62548828125, -0.4661865234375, -0.306884765625, -0.1475830078125, 0.01171875, 0.1710205078125, 0.330322265625, 0.4896240234375, 0.64892578125, 0.8082275390625, 0.967529296875, 1.1268310546875, 1.2861328125, 1.4454345703125, 1.604736328125, 1.7640380859375, 1.92333984375, 2.0826416015625, 2.241943359375, 2.4012451171875, 2.560546875, 2.7198486328125, 2.879150390625, 3.0384521484375, 3.19775390625, 3.3570556640625, 3.516357421875, 3.6756591796875, 3.8349609375, 3.9942626953125, 4.153564453125, 4.3128662109375, 4.47216796875, 4.6314697265625, 4.790771484375, 4.9500732421875, 5.109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 12.0, 8.0, 17.0, 18.0, 40.0, 54.0, 102.0, 120.0, 215.0, 416.0, 1050.0, 4953.0, 71356.0, 2616572.0, 1456444.0, 37808.0, 3313.0, 861.0, 341.0, 188.0, 123.0, 84.0, 46.0, 42.0, 30.0, 20.0, 10.0, 7.0, 7.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.8238525390625, -9.444580078125, -9.0653076171875, -8.68603515625, -8.3067626953125, -7.927490234375, -7.5482177734375, -7.1689453125, -6.7896728515625, -6.410400390625, -6.0311279296875, -5.65185546875, -5.2725830078125, -4.893310546875, -4.5140380859375, -4.134765625, -3.7554931640625, -3.376220703125, -2.9969482421875, -2.61767578125, -2.2384033203125, -1.859130859375, -1.4798583984375, -1.1005859375, -0.7213134765625, -0.342041015625, 0.0372314453125, 0.41650390625, 0.7957763671875, 1.175048828125, 1.5543212890625, 1.93359375, 2.3128662109375, 2.692138671875, 3.0714111328125, 3.45068359375, 3.8299560546875, 4.209228515625, 4.5885009765625, 4.9677734375, 5.3470458984375, 5.726318359375, 6.1055908203125, 6.48486328125, 6.8641357421875, 7.243408203125, 7.6226806640625, 8.001953125, 8.3812255859375, 8.760498046875, 9.1397705078125, 9.51904296875, 9.8983154296875, 10.277587890625, 10.6568603515625, 11.0361328125, 11.4154052734375, 11.794677734375, 12.1739501953125, 12.55322265625, 12.9324951171875, 13.311767578125, 13.6910400390625, 14.0703125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 26.0, 33.0, 78.0, 105.0, 153.0, 168.0, 138.0, 125.0, 86.0, 51.0, 23.0, 11.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.65777587890625, -12.658008575439453, -11.658241271972656, -10.65847396850586, -9.658706665039062, -8.658939361572266, -7.659172534942627, -6.65940523147583, -5.659637928009033, -4.659870624542236, -3.6601033210754395, -2.6603362560272217, -1.6605689525604248, -0.660801887512207, 0.33896541595458984, 1.3387327194213867, 2.3385000228881836, 3.3382673263549805, 4.338034629821777, 5.337801933288574, 6.337569236755371, 7.33733606338501, 8.337102890014648, 9.336870193481445, 10.336637496948242, 11.336404800415039, 12.336172103881836, 13.335939407348633, 14.33570671081543, 15.335474014282227, 16.335241317749023, 17.33500862121582, 18.334775924682617, 19.334543228149414, 20.33431053161621, 21.334077835083008, 22.333845138549805, 23.3336124420166, 24.3333797454834, 25.333147048950195, 26.332914352416992, 27.33268165588379, 28.332448959350586, 29.332216262817383, 30.33198356628418, 31.331750869750977, 32.33151626586914, 33.33128356933594, 34.331050872802734, 35.33081817626953, 36.33058547973633, 37.330352783203125, 38.33012008666992, 39.32988739013672, 40.329654693603516, 41.32942199707031, 42.32918930053711, 43.328956604003906, 44.3287239074707, 45.3284912109375, 46.3282585144043, 47.328025817871094, 48.32779312133789, 49.32756042480469, 50.327327728271484]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 8.0, 4.0, 5.0, 4.0, 4.0, 13.0, 7.0, 20.0, 14.0, 15.0, 18.0, 26.0, 23.0, 26.0, 30.0, 35.0, 34.0, 40.0, 42.0, 46.0, 40.0, 46.0, 42.0, 47.0, 45.0, 41.0, 36.0, 32.0, 31.0, 31.0, 28.0, 25.0, 25.0, 32.0, 17.0, 10.0, 10.0, 9.0, 14.0, 6.0, 8.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.956981658935547, -13.46343994140625, -12.969898223876953, -12.476357460021973, -11.982815742492676, -11.489274024963379, -10.995733261108398, -10.502191543579102, -10.008649826049805, -9.515108108520508, -9.021566390991211, -8.52802562713623, -8.034483909606934, -7.540942192077637, -7.047400951385498, -6.553859710693359, -6.0603179931640625, -5.566776275634766, -5.073235034942627, -4.579693794250488, -4.086152076721191, -3.5926105976104736, -3.099069118499756, -2.605527639389038, -2.1119861602783203, -1.6184446811676025, -1.1249032020568848, -0.631361722946167, -0.13782024383544922, 0.35572123527526855, 0.8492627143859863, 1.342804193496704, 1.8363456726074219, 2.3298871517181396, 2.8234286308288574, 3.316970109939575, 3.810511589050293, 4.30405330657959, 4.7975945472717285, 5.291135787963867, 5.784677505493164, 6.278219223022461, 6.7717604637146, 7.265301704406738, 7.758843421936035, 8.252385139465332, 8.745925903320312, 9.23946762084961, 9.733009338378906, 10.226551055908203, 10.7200927734375, 11.21363353729248, 11.707175254821777, 12.200716972351074, 12.694257736206055, 13.187799453735352, 13.681341171264648, 14.174882888793945, 14.668424606323242, 15.161965370178223, 15.65550708770752, 16.1490478515625, 16.642589569091797, 17.136131286621094, 17.62967300415039]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 12.0, 11.0, 15.0, 10.0, 22.0, 13.0, 15.0, 15.0, 26.0, 23.0, 21.0, 32.0, 35.0, 34.0, 38.0, 45.0, 42.0, 46.0, 44.0, 49.0, 42.0, 34.0, 39.0, 31.0, 25.0, 34.0, 27.0, 27.0, 17.0, 23.0, 19.0, 18.0, 18.0, 14.0, 11.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5201416015625, -1.468017578125, -1.4158935546875, -1.36376953125, -1.3116455078125, -1.259521484375, -1.2073974609375, -1.1552734375, -1.1031494140625, -1.051025390625, -0.9989013671875, -0.94677734375, -0.8946533203125, -0.842529296875, -0.7904052734375, -0.73828125, -0.6861572265625, -0.634033203125, -0.5819091796875, -0.52978515625, -0.4776611328125, -0.425537109375, -0.3734130859375, -0.3212890625, -0.2691650390625, -0.217041015625, -0.1649169921875, -0.11279296875, -0.0606689453125, -0.008544921875, 0.0435791015625, 0.095703125, 0.1478271484375, 0.199951171875, 0.2520751953125, 0.30419921875, 0.3563232421875, 0.408447265625, 0.4605712890625, 0.5126953125, 0.5648193359375, 0.616943359375, 0.6690673828125, 0.72119140625, 0.7733154296875, 0.825439453125, 0.8775634765625, 0.9296875, 0.9818115234375, 1.033935546875, 1.0860595703125, 1.13818359375, 1.1903076171875, 1.242431640625, 1.2945556640625, 1.3466796875, 1.3988037109375, 1.450927734375, 1.5030517578125, 1.55517578125, 1.6072998046875, 1.659423828125, 1.7115478515625, 1.763671875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 8.0, 13.0, 12.0, 15.0, 26.0, 40.0, 68.0, 106.0, 124.0, 193.0, 326.0, 435.0, 618.0, 834.0, 1183.0, 1702.0, 2553.0, 3679.0, 5353.0, 7847.0, 11582.0, 17610.0, 26781.0, 41993.0, 68393.0, 123064.0, 260443.0, 204910.0, 101747.0, 58728.0, 36425.0, 23472.0, 15467.0, 10435.0, 6842.0, 4816.0, 3306.0, 2267.0, 1573.0, 1078.0, 729.0, 540.0, 379.0, 273.0, 192.0, 120.0, 88.0, 58.0, 42.0, 30.0, 17.0, 14.0, 9.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29724884033203125, -0.2876129150390625, -0.27797698974609375, -0.268341064453125, -0.25870513916015625, -0.2490692138671875, -0.23943328857421875, -0.22979736328125, -0.22016143798828125, -0.2105255126953125, -0.20088958740234375, -0.191253662109375, -0.18161773681640625, -0.1719818115234375, -0.16234588623046875, -0.1527099609375, -0.14307403564453125, -0.1334381103515625, -0.12380218505859375, -0.114166259765625, -0.10453033447265625, -0.0948944091796875, -0.08525848388671875, -0.07562255859375, -0.06598663330078125, -0.0563507080078125, -0.04671478271484375, -0.037078857421875, -0.02744293212890625, -0.0178070068359375, -0.00817108154296875, 0.00146484375, 0.01110076904296875, 0.0207366943359375, 0.03037261962890625, 0.040008544921875, 0.04964447021484375, 0.0592803955078125, 0.06891632080078125, 0.07855224609375, 0.08818817138671875, 0.0978240966796875, 0.10746002197265625, 0.117095947265625, 0.12673187255859375, 0.1363677978515625, 0.14600372314453125, 0.1556396484375, 0.16527557373046875, 0.1749114990234375, 0.18454742431640625, 0.194183349609375, 0.20381927490234375, 0.2134552001953125, 0.22309112548828125, 0.23272705078125, 0.24236297607421875, 0.2519989013671875, 0.26163482666015625, 0.271270751953125, 0.28090667724609375, 0.2905426025390625, 0.30017852783203125, 0.309814453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 12.0, 10.0, 12.0, 14.0, 16.0, 7.0, 16.0, 24.0, 21.0, 36.0, 28.0, 28.0, 26.0, 36.0, 24.0, 29.0, 29.0, 35.0, 30.0, 1053.0, 41.0, 34.0, 34.0, 34.0, 33.0, 32.0, 17.0, 33.0, 32.0, 25.0, 29.0, 24.0, 11.0, 33.0, 19.0, 18.0, 12.0, 11.0, 11.0, 7.0, 9.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.9716796875, -0.9411544799804688, -0.9106292724609375, -0.8801040649414062, -0.849578857421875, -0.8190536499023438, -0.7885284423828125, -0.7580032348632812, -0.72747802734375, -0.6969528198242188, -0.6664276123046875, -0.6359024047851562, -0.605377197265625, -0.5748519897460938, -0.5443267822265625, -0.5138015747070312, -0.4832763671875, -0.45275115966796875, -0.4222259521484375, -0.39170074462890625, -0.361175537109375, -0.33065032958984375, -0.3001251220703125, -0.26959991455078125, -0.23907470703125, -0.20854949951171875, -0.1780242919921875, -0.14749908447265625, -0.116973876953125, -0.08644866943359375, -0.0559234619140625, -0.02539825439453125, 0.005126953125, 0.03565216064453125, 0.0661773681640625, 0.09670257568359375, 0.127227783203125, 0.15775299072265625, 0.1882781982421875, 0.21880340576171875, 0.24932861328125, 0.27985382080078125, 0.3103790283203125, 0.34090423583984375, 0.371429443359375, 0.40195465087890625, 0.4324798583984375, 0.46300506591796875, 0.4935302734375, 0.5240554809570312, 0.5545806884765625, 0.5851058959960938, 0.615631103515625, 0.6461563110351562, 0.6766815185546875, 0.7072067260742188, 0.73773193359375, 0.7682571411132812, 0.7987823486328125, 0.8293075561523438, 0.859832763671875, 0.8903579711914062, 0.9208831787109375, 0.9514083862304688, 0.98193359375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 11.0, 12.0, 13.0, 33.0, 53.0, 69.0, 100.0, 154.0, 242.0, 337.0, 497.0, 675.0, 1068.0, 1527.0, 2198.0, 3210.0, 4756.0, 6877.0, 10084.0, 15034.0, 22642.0, 34203.0, 54086.0, 88535.0, 159527.0, 1307727.0, 149491.0, 83884.0, 51114.0, 32801.0, 21511.0, 14145.0, 9527.0, 6458.0, 4467.0, 3145.0, 2153.0, 1540.0, 1057.0, 714.0, 502.0, 318.0, 229.0, 125.0, 98.0, 63.0, 55.0, 21.0, 16.0, 13.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2646484375, -0.25623321533203125, -0.2478179931640625, -0.23940277099609375, -0.230987548828125, -0.22257232666015625, -0.2141571044921875, -0.20574188232421875, -0.19732666015625, -0.18891143798828125, -0.1804962158203125, -0.17208099365234375, -0.163665771484375, -0.15525054931640625, -0.1468353271484375, -0.13842010498046875, -0.1300048828125, -0.12158966064453125, -0.1131744384765625, -0.10475921630859375, -0.096343994140625, -0.08792877197265625, -0.0795135498046875, -0.07109832763671875, -0.06268310546875, -0.05426788330078125, -0.0458526611328125, -0.03743743896484375, -0.029022216796875, -0.02060699462890625, -0.0121917724609375, -0.00377655029296875, 0.004638671875, 0.01305389404296875, 0.0214691162109375, 0.02988433837890625, 0.038299560546875, 0.04671478271484375, 0.0551300048828125, 0.06354522705078125, 0.07196044921875, 0.08037567138671875, 0.0887908935546875, 0.09720611572265625, 0.105621337890625, 0.11403656005859375, 0.1224517822265625, 0.13086700439453125, 0.1392822265625, 0.14769744873046875, 0.1561126708984375, 0.16452789306640625, 0.172943115234375, 0.18135833740234375, 0.1897735595703125, 0.19818878173828125, 0.20660400390625, 0.21501922607421875, 0.2234344482421875, 0.23184967041015625, 0.240264892578125, 0.24868011474609375, 0.2570953369140625, 0.26551055908203125, 0.27392578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 2.0, 8.0, 4.0, 11.0, 8.0, 10.0, 7.0, 10.0, 16.0, 17.0, 17.0, 17.0, 28.0, 44.0, 53.0, 45.0, 41.0, 64.0, 60.0, 59.0, 67.0, 48.0, 55.0, 36.0, 44.0, 43.0, 33.0, 23.0, 29.0, 19.0, 17.0, 13.0, 3.0, 5.0, 5.0, 9.0, 6.0, 8.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.00022685527801513672, -0.000220518559217453, -0.0002141818404197693, -0.00020784512162208557, -0.00020150840282440186, -0.00019517168402671814, -0.00018883496522903442, -0.0001824982464313507, -0.000176161527633667, -0.00016982480883598328, -0.00016348809003829956, -0.00015715137124061584, -0.00015081465244293213, -0.0001444779336452484, -0.0001381412148475647, -0.00013180449604988098, -0.00012546777725219727, -0.00011913105845451355, -0.00011279433965682983, -0.00010645762085914612, -0.0001001209020614624, -9.378418326377869e-05, -8.744746446609497e-05, -8.111074566841125e-05, -7.477402687072754e-05, -6.843730807304382e-05, -6.210058927536011e-05, -5.576387047767639e-05, -4.9427151679992676e-05, -4.309043288230896e-05, -3.6753714084625244e-05, -3.041699528694153e-05, -2.4080276489257812e-05, -1.7743557691574097e-05, -1.1406838893890381e-05, -5.070120096206665e-06, 1.2665987014770508e-06, 7.603317499160767e-06, 1.3940036296844482e-05, 2.0276755094528198e-05, 2.6613473892211914e-05, 3.295019268989563e-05, 3.9286911487579346e-05, 4.562363028526306e-05, 5.196034908294678e-05, 5.829706788063049e-05, 6.463378667831421e-05, 7.097050547599792e-05, 7.730722427368164e-05, 8.364394307136536e-05, 8.998066186904907e-05, 9.631738066673279e-05, 0.0001026540994644165, 0.00010899081826210022, 0.00011532753705978394, 0.00012166425585746765, 0.00012800097465515137, 0.00013433769345283508, 0.0001406744122505188, 0.00014701113104820251, 0.00015334784984588623, 0.00015968456864356995, 0.00016602128744125366, 0.00017235800623893738, 0.0001786947250366211]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 13.0, 11.0, 19.0, 25.0, 31.0, 40.0, 55.0, 56.0, 81.0, 83.0, 115.0, 187.0, 223.0, 356.0, 491.0, 1668.0, 133911.0, 899980.0, 8834.0, 794.0, 425.0, 295.0, 189.0, 144.0, 108.0, 67.0, 47.0, 58.0, 40.0, 26.0, 22.0, 24.0, 24.0, 19.0, 15.0, 16.0, 6.0, 9.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00284576416015625, -0.00274503231048584, -0.0026443004608154297, -0.0025435686111450195, -0.0024428367614746094, -0.0023421049118041992, -0.002241373062133789, -0.002140641212463379, -0.0020399093627929688, -0.0019391775131225586, -0.0018384456634521484, -0.0017377138137817383, -0.0016369819641113281, -0.001536250114440918, -0.0014355182647705078, -0.0013347864151000977, -0.0012340545654296875, -0.0011333227157592773, -0.0010325908660888672, -0.000931859016418457, -0.0008311271667480469, -0.0007303953170776367, -0.0006296634674072266, -0.0005289316177368164, -0.00042819976806640625, -0.0003274679183959961, -0.00022673606872558594, -0.00012600421905517578, -2.5272369384765625e-05, 7.545948028564453e-05, 0.0001761913299560547, 0.00027692317962646484, 0.000377655029296875, 0.00047838687896728516, 0.0005791187286376953, 0.0006798505783081055, 0.0007805824279785156, 0.0008813142776489258, 0.000982046127319336, 0.001082777976989746, 0.0011835098266601562, 0.0012842416763305664, 0.0013849735260009766, 0.0014857053756713867, 0.0015864372253417969, 0.001687169075012207, 0.0017879009246826172, 0.0018886327743530273, 0.0019893646240234375, 0.0020900964736938477, 0.002190828323364258, 0.002291560173034668, 0.002392292022705078, 0.0024930238723754883, 0.0025937557220458984, 0.0026944875717163086, 0.0027952194213867188, 0.002895951271057129, 0.002996683120727539, 0.0030974149703979492, 0.0031981468200683594, 0.0032988786697387695, 0.0033996105194091797, 0.00350034236907959, 0.00360107421875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 17.0, 39.0, 84.0, 172.0, 225.0, 210.0, 136.0, 67.0, 37.0, 14.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040207267738878727, -0.00039331018342636526, -0.0003845477185677737, -0.0003757852246053517, -0.0003670227306429297, -0.00035826023668050766, -0.0003494977718219161, -0.0003407352778594941, -0.0003319727838970721, -0.00032321028993465006, -0.0003144478250760585, -0.0003056853311136365, -0.0002969228371512145, -0.00028816034318879247, -0.0002793978783302009, -0.0002706353843677789, -0.0002618728904053569, -0.00025311039644293487, -0.0002443479315843433, -0.0002355854376219213, -0.0002268229436594993, -0.0002180604642489925, -0.00020929798483848572, -0.0002005354908760637, -0.00019177302601747215, -0.00018301054660696536, -0.00017424805264454335, -0.00016548557323403656, -0.00015672307927161455, -0.00014796059986110777, -0.00013919812045060098, -0.00013043562648817897, -0.00012167311797384173, -0.00011291063128737733, -0.00010414814460091293, -9.538566519040614e-05, -8.662317122798413e-05, -7.786069181747735e-05, -6.909820513101295e-05, -6.033571844454855e-05, -5.157323175808415e-05, -4.281074507161975e-05, -3.404825838515535e-05, -2.5285775336669758e-05, -1.652328865020536e-05, -7.76080196374096e-06, 1.0016810847446322e-06, 9.764167771209031e-06, 1.852665445767343e-05, 2.728914114413783e-05, 3.605162783060223e-05, 4.481411087908782e-05, 5.357659756555222e-05, 6.233908061403781e-05, 7.110156730050221e-05, 7.986405398696661e-05, 8.862654067343101e-05, 9.738902735989541e-05, 0.00010615151404635981, 0.0001149140007328242, 0.000123676480143331, 0.000132438974105753, 0.0001412014535162598, 0.0001499639474786818, 0.0001587264268891886]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 15.0, 13.0, 13.0, 20.0, 22.0, 15.0, 26.0, 33.0, 24.0, 28.0, 55.0, 35.0, 35.0, 37.0, 43.0, 42.0, 29.0, 35.0, 27.0, 41.0, 37.0, 32.0, 33.0, 21.0, 35.0, 35.0, 22.0, 24.0, 31.0, 16.0, 20.0, 16.0, 13.0, 12.0, 6.0, 2.0, 7.0, 3.0, 9.0, 1.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00010120868682861328, -9.79127362370491e-05, -9.461678564548492e-05, -9.132083505392075e-05, -8.802488446235657e-05, -8.472893387079239e-05, -8.143298327922821e-05, -7.813703268766403e-05, -7.484108209609985e-05, -7.154513150453568e-05, -6.82491809129715e-05, -6.495323032140732e-05, -6.165727972984314e-05, -5.836132913827896e-05, -5.506537854671478e-05, -5.1769427955150604e-05, -4.8473477363586426e-05, -4.517752677202225e-05, -4.188157618045807e-05, -3.858562558889389e-05, -3.528967499732971e-05, -3.1993724405765533e-05, -2.8697773814201355e-05, -2.5401823222637177e-05, -2.2105872631072998e-05, -1.880992203950882e-05, -1.551397144794464e-05, -1.2218020856380463e-05, -8.922070264816284e-06, -5.626119673252106e-06, -2.3301690816879272e-06, 9.657815098762512e-07, 4.26173210144043e-06, 7.557682693004608e-06, 1.0853633284568787e-05, 1.4149583876132965e-05, 1.7445534467697144e-05, 2.0741485059261322e-05, 2.40374356508255e-05, 2.733338624238968e-05, 3.062933683395386e-05, 3.3925287425518036e-05, 3.7221238017082214e-05, 4.051718860864639e-05, 4.381313920021057e-05, 4.710908979177475e-05, 5.040504038333893e-05, 5.370099097490311e-05, 5.6996941566467285e-05, 6.0292892158031464e-05, 6.358884274959564e-05, 6.688479334115982e-05, 7.0180743932724e-05, 7.347669452428818e-05, 7.677264511585236e-05, 8.006859570741653e-05, 8.336454629898071e-05, 8.666049689054489e-05, 8.995644748210907e-05, 9.325239807367325e-05, 9.654834866523743e-05, 9.98442992568016e-05, 0.00010314024984836578, 0.00010643620043992996, 0.00010973215103149414]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 12.0, 11.0, 15.0, 10.0, 22.0, 13.0, 15.0, 15.0, 26.0, 23.0, 21.0, 32.0, 35.0, 34.0, 38.0, 45.0, 42.0, 46.0, 44.0, 49.0, 42.0, 34.0, 39.0, 31.0, 25.0, 34.0, 27.0, 27.0, 17.0, 23.0, 19.0, 18.0, 18.0, 14.0, 11.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5201416015625, -1.468017578125, -1.4158935546875, -1.36376953125, -1.3116455078125, -1.259521484375, -1.2073974609375, -1.1552734375, -1.1031494140625, -1.051025390625, -0.9989013671875, -0.94677734375, -0.8946533203125, -0.842529296875, -0.7904052734375, -0.73828125, -0.6861572265625, -0.634033203125, -0.5819091796875, -0.52978515625, -0.4776611328125, -0.425537109375, -0.3734130859375, -0.3212890625, -0.2691650390625, -0.217041015625, -0.1649169921875, -0.11279296875, -0.0606689453125, -0.008544921875, 0.0435791015625, 0.095703125, 0.1478271484375, 0.199951171875, 0.2520751953125, 0.30419921875, 0.3563232421875, 0.408447265625, 0.4605712890625, 0.5126953125, 0.5648193359375, 0.616943359375, 0.6690673828125, 0.72119140625, 0.7733154296875, 0.825439453125, 0.8775634765625, 0.9296875, 0.9818115234375, 1.033935546875, 1.0860595703125, 1.13818359375, 1.1903076171875, 1.242431640625, 1.2945556640625, 1.3466796875, 1.3988037109375, 1.450927734375, 1.5030517578125, 1.55517578125, 1.6072998046875, 1.659423828125, 1.7115478515625, 1.763671875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 12.0, 10.0, 14.0, 17.0, 26.0, 29.0, 49.0, 60.0, 90.0, 123.0, 178.0, 277.0, 388.0, 587.0, 981.0, 1692.0, 2917.0, 5442.0, 10368.0, 22412.0, 56867.0, 184221.0, 455573.0, 197669.0, 60898.0, 23707.0, 10616.0, 5503.0, 3035.0, 1821.0, 1071.0, 624.0, 402.0, 263.0, 174.0, 121.0, 98.0, 59.0, 45.0, 30.0, 25.0, 15.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.251953125, -2.175689697265625, -2.09942626953125, -2.023162841796875, -1.9468994140625, -1.870635986328125, -1.79437255859375, -1.718109130859375, -1.641845703125, -1.565582275390625, -1.48931884765625, -1.413055419921875, -1.3367919921875, -1.260528564453125, -1.18426513671875, -1.108001708984375, -1.03173828125, -0.955474853515625, -0.87921142578125, -0.802947998046875, -0.7266845703125, -0.650421142578125, -0.57415771484375, -0.497894287109375, -0.421630859375, -0.345367431640625, -0.26910400390625, -0.192840576171875, -0.1165771484375, -0.040313720703125, 0.03594970703125, 0.112213134765625, 0.1884765625, 0.264739990234375, 0.34100341796875, 0.417266845703125, 0.4935302734375, 0.569793701171875, 0.64605712890625, 0.722320556640625, 0.798583984375, 0.874847412109375, 0.95111083984375, 1.027374267578125, 1.1036376953125, 1.179901123046875, 1.25616455078125, 1.332427978515625, 1.40869140625, 1.484954833984375, 1.56121826171875, 1.637481689453125, 1.7137451171875, 1.790008544921875, 1.86627197265625, 1.942535400390625, 2.018798828125, 2.095062255859375, 2.17132568359375, 2.247589111328125, 2.3238525390625, 2.400115966796875, 2.47637939453125, 2.552642822265625, 2.62890625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 10.0, 15.0, 10.0, 12.0, 16.0, 14.0, 15.0, 14.0, 25.0, 20.0, 31.0, 42.0, 43.0, 44.0, 43.0, 73.0, 110.0, 182.0, 1392.0, 296.0, 129.0, 79.0, 54.0, 42.0, 47.0, 30.0, 30.0, 27.0, 20.0, 23.0, 21.0, 26.0, 25.0, 9.0, 15.0, 11.0, 5.0, 8.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.5743408203125, -5.386962890625, -5.1995849609375, -5.01220703125, -4.8248291015625, -4.637451171875, -4.4500732421875, -4.2626953125, -4.0753173828125, -3.887939453125, -3.7005615234375, -3.51318359375, -3.3258056640625, -3.138427734375, -2.9510498046875, -2.763671875, -2.5762939453125, -2.388916015625, -2.2015380859375, -2.01416015625, -1.8267822265625, -1.639404296875, -1.4520263671875, -1.2646484375, -1.0772705078125, -0.889892578125, -0.7025146484375, -0.51513671875, -0.3277587890625, -0.140380859375, 0.0469970703125, 0.234375, 0.4217529296875, 0.609130859375, 0.7965087890625, 0.98388671875, 1.1712646484375, 1.358642578125, 1.5460205078125, 1.7333984375, 1.9207763671875, 2.108154296875, 2.2955322265625, 2.48291015625, 2.6702880859375, 2.857666015625, 3.0450439453125, 3.232421875, 3.4197998046875, 3.607177734375, 3.7945556640625, 3.98193359375, 4.1693115234375, 4.356689453125, 4.5440673828125, 4.7314453125, 4.9188232421875, 5.106201171875, 5.2935791015625, 5.48095703125, 5.6683349609375, 5.855712890625, 6.0430908203125, 6.23046875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 2.0, 7.0, 11.0, 21.0, 38.0, 39.0, 73.0, 117.0, 181.0, 374.0, 1246.0, 36173.0, 3093095.0, 12571.0, 943.0, 320.0, 165.0, 98.0, 66.0, 48.0, 34.0, 20.0, 22.0, 15.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.5625, -25.790283203125, -25.01806640625, -24.245849609375, -23.4736328125, -22.701416015625, -21.92919921875, -21.156982421875, -20.384765625, -19.612548828125, -18.84033203125, -18.068115234375, -17.2958984375, -16.523681640625, -15.75146484375, -14.979248046875, -14.20703125, -13.434814453125, -12.66259765625, -11.890380859375, -11.1181640625, -10.345947265625, -9.57373046875, -8.801513671875, -8.029296875, -7.257080078125, -6.48486328125, -5.712646484375, -4.9404296875, -4.168212890625, -3.39599609375, -2.623779296875, -1.8515625, -1.079345703125, -0.30712890625, 0.465087890625, 1.2373046875, 2.009521484375, 2.78173828125, 3.553955078125, 4.326171875, 5.098388671875, 5.87060546875, 6.642822265625, 7.4150390625, 8.187255859375, 8.95947265625, 9.731689453125, 10.50390625, 11.276123046875, 12.04833984375, 12.820556640625, 13.5927734375, 14.364990234375, 15.13720703125, 15.909423828125, 16.681640625, 17.453857421875, 18.22607421875, 18.998291015625, 19.7705078125, 20.542724609375, 21.31494140625, 22.087158203125, 22.859375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 144.0, 560.0, 282.0, 19.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-102.21324920654297, -100.40779113769531, -98.60233306884766, -96.796875, -94.99141693115234, -93.18595886230469, -91.38050079345703, -89.57504272460938, -87.76958465576172, -85.96412658691406, -84.1586685180664, -82.35321044921875, -80.5477523803711, -78.74229431152344, -76.93683624267578, -75.13137817382812, -73.32592010498047, -71.52046203613281, -69.71500396728516, -67.9095458984375, -66.10408782958984, -64.29862976074219, -62.49317169189453, -60.687713623046875, -58.882259368896484, -57.07680130004883, -55.27134323120117, -53.465885162353516, -51.66042709350586, -49.8549690246582, -48.04951095581055, -46.24405288696289, -44.43859100341797, -42.63313293457031, -40.827674865722656, -39.022216796875, -37.216758728027344, -35.41130065917969, -33.60584259033203, -31.800384521484375, -29.994930267333984, -28.189472198486328, -26.384014129638672, -24.578556060791016, -22.77309799194336, -20.967639923095703, -19.162181854248047, -17.35672378540039, -15.551265716552734, -13.745807647705078, -11.940349578857422, -10.134891510009766, -8.32943344116211, -6.5239763259887695, -4.718518257141113, -2.913060188293457, -1.1076021194458008, 0.6978558301925659, 2.5033137798309326, 4.30877161026001, 6.114229679107666, 7.919687271118164, 9.72514533996582, 11.530603408813477, 13.336061477661133]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 11.0, 10.0, 9.0, 8.0, 9.0, 15.0, 9.0, 10.0, 24.0, 15.0, 31.0, 19.0, 37.0, 16.0, 27.0, 30.0, 23.0, 31.0, 32.0, 32.0, 41.0, 32.0, 41.0, 44.0, 43.0, 36.0, 38.0, 25.0, 42.0, 27.0, 30.0, 26.0, 19.0, 21.0, 24.0, 18.0, 16.0, 19.0, 6.0, 9.0, 9.0, 7.0, 4.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.81233024597168, -17.27786636352539, -16.7434024810791, -16.208938598632812, -15.674473762512207, -15.140008926391602, -14.605545043945312, -14.071081161499023, -13.536617279052734, -13.002153396606445, -12.46768856048584, -11.93322467803955, -11.398760795593262, -10.864295959472656, -10.329832077026367, -9.795368194580078, -9.260903358459473, -8.726439476013184, -8.191974639892578, -7.657510757446289, -7.123046875, -6.588582515716553, -6.0541181564331055, -5.519654273986816, -4.985189914703369, -4.450725555419922, -3.916261672973633, -3.3817973136901855, -2.8473331928253174, -2.312869071960449, -1.778404712677002, -1.2439405918121338, -0.7094764709472656, -0.17501229047775269, 0.35945188999176025, 0.893916130065918, 1.4283802509307861, 1.9628443717956543, 2.4973087310791016, 3.0317728519439697, 3.566236972808838, 4.100701332092285, 4.635165214538574, 5.1696295738220215, 5.704093933105469, 6.238557815551758, 6.773022174835205, 7.307486534118652, 7.841950416564941, 8.37641429901123, 8.910879135131836, 9.445343017578125, 9.979806900024414, 10.514270782470703, 11.048735618591309, 11.583199501037598, 12.117664337158203, 12.652128219604492, 13.186593055725098, 13.721056938171387, 14.255520820617676, 14.789985656738281, 15.32444953918457, 15.85891342163086, 16.39337730407715]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 4.0, 6.0, 6.0, 6.0, 6.0, 9.0, 12.0, 13.0, 12.0, 13.0, 10.0, 16.0, 27.0, 29.0, 32.0, 22.0, 25.0, 28.0, 31.0, 40.0, 40.0, 35.0, 40.0, 40.0, 39.0, 35.0, 33.0, 33.0, 35.0, 46.0, 29.0, 24.0, 19.0, 31.0, 25.0, 23.0, 14.0, 17.0, 11.0, 13.0, 13.0, 14.0, 6.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.6435546875, -1.5915069580078125, -1.539459228515625, -1.4874114990234375, -1.43536376953125, -1.3833160400390625, -1.331268310546875, -1.2792205810546875, -1.2271728515625, -1.1751251220703125, -1.123077392578125, -1.0710296630859375, -1.01898193359375, -0.9669342041015625, -0.914886474609375, -0.8628387451171875, -0.810791015625, -0.7587432861328125, -0.706695556640625, -0.6546478271484375, -0.60260009765625, -0.5505523681640625, -0.498504638671875, -0.4464569091796875, -0.3944091796875, -0.3423614501953125, -0.290313720703125, -0.2382659912109375, -0.18621826171875, -0.1341705322265625, -0.082122802734375, -0.0300750732421875, 0.02197265625, 0.0740203857421875, 0.126068115234375, 0.1781158447265625, 0.23016357421875, 0.2822113037109375, 0.334259033203125, 0.3863067626953125, 0.4383544921875, 0.4904022216796875, 0.542449951171875, 0.5944976806640625, 0.64654541015625, 0.6985931396484375, 0.750640869140625, 0.8026885986328125, 0.854736328125, 0.9067840576171875, 0.958831787109375, 1.0108795166015625, 1.06292724609375, 1.1149749755859375, 1.167022705078125, 1.2190704345703125, 1.2711181640625, 1.3231658935546875, 1.375213623046875, 1.4272613525390625, 1.47930908203125, 1.5313568115234375, 1.583404541015625, 1.6354522705078125, 1.6875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 6.0, 17.0, 14.0, 17.0, 28.0, 36.0, 46.0, 74.0, 99.0, 139.0, 222.0, 333.0, 559.0, 1021.0, 2093.0, 4759.0, 11658.0, 32405.0, 101002.0, 333404.0, 909759.0, 1400407.0, 902799.0, 336663.0, 102817.0, 32302.0, 11773.0, 4868.0, 2208.0, 1127.0, 540.0, 329.0, 216.0, 149.0, 96.0, 84.0, 58.0, 30.0, 23.0, 24.0, 13.0, 15.0, 13.0, 3.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.27734375, -2.207275390625, -2.13720703125, -2.067138671875, -1.9970703125, -1.927001953125, -1.85693359375, -1.786865234375, -1.716796875, -1.646728515625, -1.57666015625, -1.506591796875, -1.4365234375, -1.366455078125, -1.29638671875, -1.226318359375, -1.15625, -1.086181640625, -1.01611328125, -0.946044921875, -0.8759765625, -0.805908203125, -0.73583984375, -0.665771484375, -0.595703125, -0.525634765625, -0.45556640625, -0.385498046875, -0.3154296875, -0.245361328125, -0.17529296875, -0.105224609375, -0.03515625, 0.034912109375, 0.10498046875, 0.175048828125, 0.2451171875, 0.315185546875, 0.38525390625, 0.455322265625, 0.525390625, 0.595458984375, 0.66552734375, 0.735595703125, 0.8056640625, 0.875732421875, 0.94580078125, 1.015869140625, 1.0859375, 1.156005859375, 1.22607421875, 1.296142578125, 1.3662109375, 1.436279296875, 1.50634765625, 1.576416015625, 1.646484375, 1.716552734375, 1.78662109375, 1.856689453125, 1.9267578125, 1.996826171875, 2.06689453125, 2.136962890625, 2.20703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 7.0, 10.0, 19.0, 25.0, 47.0, 45.0, 69.0, 98.0, 130.0, 170.0, 216.0, 263.0, 356.0, 395.0, 406.0, 337.0, 271.0, 259.0, 208.0, 188.0, 137.0, 94.0, 65.0, 49.0, 51.0, 30.0, 24.0, 24.0, 18.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.91400146484375, -3.7811279296875, -3.64825439453125, -3.515380859375, -3.38250732421875, -3.2496337890625, -3.11676025390625, -2.98388671875, -2.85101318359375, -2.7181396484375, -2.58526611328125, -2.452392578125, -2.31951904296875, -2.1866455078125, -2.05377197265625, -1.9208984375, -1.78802490234375, -1.6551513671875, -1.52227783203125, -1.389404296875, -1.25653076171875, -1.1236572265625, -0.99078369140625, -0.85791015625, -0.72503662109375, -0.5921630859375, -0.45928955078125, -0.326416015625, -0.19354248046875, -0.0606689453125, 0.07220458984375, 0.205078125, 0.33795166015625, 0.4708251953125, 0.60369873046875, 0.736572265625, 0.86944580078125, 1.0023193359375, 1.13519287109375, 1.26806640625, 1.40093994140625, 1.5338134765625, 1.66668701171875, 1.799560546875, 1.93243408203125, 2.0653076171875, 2.19818115234375, 2.3310546875, 2.46392822265625, 2.5968017578125, 2.72967529296875, 2.862548828125, 2.99542236328125, 3.1282958984375, 3.26116943359375, 3.39404296875, 3.52691650390625, 3.6597900390625, 3.79266357421875, 3.925537109375, 4.05841064453125, 4.1912841796875, 4.32415771484375, 4.45703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 11.0, 25.0, 25.0, 42.0, 48.0, 60.0, 67.0, 115.0, 218.0, 460.0, 1619.0, 12262.0, 310012.0, 3470945.0, 381343.0, 14146.0, 1695.0, 510.0, 221.0, 130.0, 96.0, 61.0, 41.0, 23.0, 19.0, 19.0, 18.0, 9.0, 12.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.10498046875, -10.7412109375, -10.37744140625, -10.013671875, -9.64990234375, -9.2861328125, -8.92236328125, -8.55859375, -8.19482421875, -7.8310546875, -7.46728515625, -7.103515625, -6.73974609375, -6.3759765625, -6.01220703125, -5.6484375, -5.28466796875, -4.9208984375, -4.55712890625, -4.193359375, -3.82958984375, -3.4658203125, -3.10205078125, -2.73828125, -2.37451171875, -2.0107421875, -1.64697265625, -1.283203125, -0.91943359375, -0.5556640625, -0.19189453125, 0.171875, 0.53564453125, 0.8994140625, 1.26318359375, 1.626953125, 1.99072265625, 2.3544921875, 2.71826171875, 3.08203125, 3.44580078125, 3.8095703125, 4.17333984375, 4.537109375, 4.90087890625, 5.2646484375, 5.62841796875, 5.9921875, 6.35595703125, 6.7197265625, 7.08349609375, 7.447265625, 7.81103515625, 8.1748046875, 8.53857421875, 8.90234375, 9.26611328125, 9.6298828125, 9.99365234375, 10.357421875, 10.72119140625, 11.0849609375, 11.44873046875, 11.8125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 22.0, 68.0, 182.0, 252.0, 216.0, 158.0, 75.0, 23.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.831392288208008, -13.320860862731934, -11.81032943725586, -10.299797058105469, -8.789265632629395, -7.27873420715332, -5.76820182800293, -4.2576704025268555, -2.7471389770507812, -1.236607313156128, 0.2739243507385254, 1.7844562530517578, 3.294987678527832, 4.805519104003906, 6.316051483154297, 7.826582908630371, 9.337114334106445, 10.84764575958252, 12.358177185058594, 13.868709564208984, 15.379240989685059, 16.889772415161133, 18.400304794311523, 19.91083526611328, 21.421367645263672, 22.931900024414062, 24.44243049621582, 25.95296287536621, 27.46349334716797, 28.97402572631836, 30.48455810546875, 31.99509048461914, 33.50562286376953, 35.01615524291992, 36.52668762207031, 38.03721618652344, 39.54774856567383, 41.05828094482422, 42.56881332397461, 44.079345703125, 45.589874267578125, 47.100406646728516, 48.610939025878906, 50.12146759033203, 51.63199996948242, 53.14253234863281, 54.6530647277832, 56.163597106933594, 57.674129486083984, 59.184661865234375, 60.695194244384766, 62.205726623535156, 63.71625518798828, 65.22679138183594, 66.73731994628906, 68.24784851074219, 69.75838470458984, 71.26891326904297, 72.77944946289062, 74.28997802734375, 75.8005142211914, 77.31104278564453, 78.82157897949219, 80.33210754394531, 81.84263610839844]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 10.0, 4.0, 5.0, 11.0, 14.0, 8.0, 19.0, 15.0, 20.0, 27.0, 27.0, 26.0, 23.0, 49.0, 39.0, 50.0, 43.0, 52.0, 37.0, 45.0, 49.0, 47.0, 36.0, 38.0, 32.0, 31.0, 29.0, 33.0, 30.0, 23.0, 27.0, 19.0, 22.0, 7.0, 10.0, 8.0, 6.0, 13.0, 7.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.446765899658203, -16.941373825073242, -16.43597984313965, -15.930586814880371, -15.425193786621094, -14.919801712036133, -14.414408683776855, -13.909015655517578, -13.4036226272583, -12.898229598999023, -12.392836570739746, -11.887443542480469, -11.382051467895508, -10.876657485961914, -10.371265411376953, -9.865872383117676, -9.360479354858398, -8.855086326599121, -8.349693298339844, -7.844300746917725, -7.338907718658447, -6.83351469039917, -6.328122138977051, -5.822729110717773, -5.317336082458496, -4.811943054199219, -4.306550025939941, -3.8011574745178223, -3.295764446258545, -2.7903714179992676, -2.2849786281585693, -1.779585838317871, -1.2741947174072266, -0.7688018083572388, -0.263408899307251, 0.24198400974273682, 0.7473769187927246, 1.252769947052002, 1.7581627368927002, 2.2635555267333984, 2.768948554992676, 3.274341583251953, 3.7797343730926514, 4.28512716293335, 4.790520191192627, 5.295913219451904, 5.801305770874023, 6.306698799133301, 6.812091827392578, 7.3174848556518555, 7.822877883911133, 8.32827091217041, 8.833663940429688, 9.339056015014648, 9.844449043273926, 10.349842071533203, 10.85523509979248, 11.360628128051758, 11.866021156311035, 12.371414184570312, 12.876806259155273, 13.382200241088867, 13.887592315673828, 14.392985343933105, 14.898378372192383]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 8.0, 5.0, 8.0, 15.0, 19.0, 21.0, 22.0, 33.0, 20.0, 27.0, 33.0, 26.0, 45.0, 44.0, 44.0, 38.0, 32.0, 44.0, 39.0, 38.0, 38.0, 40.0, 43.0, 31.0, 31.0, 38.0, 25.0, 23.0, 25.0, 8.0, 12.0, 16.0, 13.0, 13.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.6841278076171875, -1.626068115234375, -1.5680084228515625, -1.50994873046875, -1.4518890380859375, -1.393829345703125, -1.3357696533203125, -1.2777099609375, -1.2196502685546875, -1.161590576171875, -1.1035308837890625, -1.04547119140625, -0.9874114990234375, -0.929351806640625, -0.8712921142578125, -0.813232421875, -0.7551727294921875, -0.697113037109375, -0.6390533447265625, -0.58099365234375, -0.5229339599609375, -0.464874267578125, -0.4068145751953125, -0.3487548828125, -0.2906951904296875, -0.232635498046875, -0.1745758056640625, -0.11651611328125, -0.0584564208984375, -0.000396728515625, 0.0576629638671875, 0.11572265625, 0.1737823486328125, 0.231842041015625, 0.2899017333984375, 0.34796142578125, 0.4060211181640625, 0.464080810546875, 0.5221405029296875, 0.5802001953125, 0.6382598876953125, 0.696319580078125, 0.7543792724609375, 0.81243896484375, 0.8704986572265625, 0.928558349609375, 0.9866180419921875, 1.044677734375, 1.1027374267578125, 1.160797119140625, 1.2188568115234375, 1.27691650390625, 1.3349761962890625, 1.393035888671875, 1.4510955810546875, 1.5091552734375, 1.5672149658203125, 1.625274658203125, 1.6833343505859375, 1.74139404296875, 1.7994537353515625, 1.857513427734375, 1.9155731201171875, 1.9736328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 7.0, 4.0, 8.0, 14.0, 24.0, 29.0, 43.0, 66.0, 99.0, 149.0, 187.0, 312.0, 417.0, 672.0, 968.0, 1361.0, 2032.0, 2893.0, 4263.0, 6013.0, 9129.0, 13329.0, 20393.0, 31397.0, 51219.0, 87215.0, 165808.0, 283212.0, 150000.0, 80975.0, 47764.0, 29522.0, 19304.0, 12575.0, 8542.0, 5955.0, 3961.0, 2736.0, 1875.0, 1274.0, 880.0, 601.0, 449.0, 273.0, 213.0, 137.0, 96.0, 60.0, 39.0, 28.0, 14.0, 10.0, 13.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.31319427490234375, -0.3029022216796875, -0.29261016845703125, -0.282318115234375, -0.27202606201171875, -0.2617340087890625, -0.25144195556640625, -0.24114990234375, -0.23085784912109375, -0.2205657958984375, -0.21027374267578125, -0.199981689453125, -0.18968963623046875, -0.1793975830078125, -0.16910552978515625, -0.1588134765625, -0.14852142333984375, -0.1382293701171875, -0.12793731689453125, -0.117645263671875, -0.10735321044921875, -0.0970611572265625, -0.08676910400390625, -0.07647705078125, -0.06618499755859375, -0.0558929443359375, -0.04560089111328125, -0.035308837890625, -0.02501678466796875, -0.0147247314453125, -0.00443267822265625, 0.005859375, 0.01615142822265625, 0.0264434814453125, 0.03673553466796875, 0.047027587890625, 0.05731964111328125, 0.0676116943359375, 0.07790374755859375, 0.08819580078125, 0.09848785400390625, 0.1087799072265625, 0.11907196044921875, 0.129364013671875, 0.13965606689453125, 0.1499481201171875, 0.16024017333984375, 0.1705322265625, 0.18082427978515625, 0.1911163330078125, 0.20140838623046875, 0.211700439453125, 0.22199249267578125, 0.2322845458984375, 0.24257659912109375, 0.25286865234375, 0.26316070556640625, 0.2734527587890625, 0.28374481201171875, 0.294036865234375, 0.30432891845703125, 0.3146209716796875, 0.32491302490234375, 0.335205078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 5.0, 4.0, 4.0, 8.0, 2.0, 9.0, 10.0, 10.0, 14.0, 18.0, 27.0, 15.0, 21.0, 25.0, 32.0, 34.0, 38.0, 35.0, 29.0, 34.0, 39.0, 31.0, 1072.0, 51.0, 49.0, 36.0, 44.0, 41.0, 37.0, 34.0, 20.0, 30.0, 26.0, 22.0, 22.0, 12.0, 13.0, 16.0, 9.0, 12.0, 9.0, 7.0, 4.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2392578125, -1.2024078369140625, -1.165557861328125, -1.1287078857421875, -1.09185791015625, -1.0550079345703125, -1.018157958984375, -0.9813079833984375, -0.9444580078125, -0.9076080322265625, -0.870758056640625, -0.8339080810546875, -0.79705810546875, -0.7602081298828125, -0.723358154296875, -0.6865081787109375, -0.649658203125, -0.6128082275390625, -0.575958251953125, -0.5391082763671875, -0.50225830078125, -0.4654083251953125, -0.428558349609375, -0.3917083740234375, -0.3548583984375, -0.3180084228515625, -0.281158447265625, -0.2443084716796875, -0.20745849609375, -0.1706085205078125, -0.133758544921875, -0.0969085693359375, -0.06005859375, -0.0232086181640625, 0.013641357421875, 0.0504913330078125, 0.08734130859375, 0.1241912841796875, 0.161041259765625, 0.1978912353515625, 0.2347412109375, 0.2715911865234375, 0.308441162109375, 0.3452911376953125, 0.38214111328125, 0.4189910888671875, 0.455841064453125, 0.4926910400390625, 0.529541015625, 0.5663909912109375, 0.603240966796875, 0.6400909423828125, 0.67694091796875, 0.7137908935546875, 0.750640869140625, 0.7874908447265625, 0.8243408203125, 0.8611907958984375, 0.898040771484375, 0.9348907470703125, 0.97174072265625, 1.0085906982421875, 1.045440673828125, 1.0822906494140625, 1.119140625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 4.0, 16.0, 13.0, 26.0, 37.0, 50.0, 76.0, 99.0, 144.0, 244.0, 358.0, 489.0, 737.0, 1093.0, 1660.0, 2400.0, 3477.0, 5183.0, 7527.0, 11576.0, 17713.0, 28041.0, 45921.0, 80403.0, 155560.0, 1348125.0, 168058.0, 84978.0, 48978.0, 29454.0, 18487.0, 11909.0, 7697.0, 5224.0, 3497.0, 2412.0, 1745.0, 1183.0, 800.0, 545.0, 401.0, 258.0, 191.0, 118.0, 78.0, 47.0, 37.0, 27.0, 14.0, 9.0, 6.0, 0.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.33544921875, -0.3254508972167969, -0.31545257568359375, -0.3054542541503906, -0.2954559326171875, -0.2854576110839844, -0.27545928955078125, -0.2654609680175781, -0.255462646484375, -0.24546432495117188, -0.23546600341796875, -0.22546768188476562, -0.2154693603515625, -0.20547103881835938, -0.19547271728515625, -0.18547439575195312, -0.17547607421875, -0.16547775268554688, -0.15547943115234375, -0.14548110961914062, -0.1354827880859375, -0.12548446655273438, -0.11548614501953125, -0.10548782348632812, -0.095489501953125, -0.08549118041992188, -0.07549285888671875, -0.06549453735351562, -0.0554962158203125, -0.045497894287109375, -0.03549957275390625, -0.025501251220703125, -0.0155029296875, -0.005504608154296875, 0.00449371337890625, 0.014492034912109375, 0.0244903564453125, 0.034488677978515625, 0.04448699951171875, 0.054485321044921875, 0.064483642578125, 0.07448196411132812, 0.08448028564453125, 0.09447860717773438, 0.1044769287109375, 0.11447525024414062, 0.12447357177734375, 0.13447189331054688, 0.14447021484375, 0.15446853637695312, 0.16446685791015625, 0.17446517944335938, 0.1844635009765625, 0.19446182250976562, 0.20446014404296875, 0.21445846557617188, 0.224456787109375, 0.23445510864257812, 0.24445343017578125, 0.2544517517089844, 0.2644500732421875, 0.2744483947753906, 0.28444671630859375, 0.2944450378417969, 0.304443359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 9.0, 12.0, 22.0, 18.0, 17.0, 30.0, 46.0, 44.0, 62.0, 56.0, 57.0, 45.0, 59.0, 75.0, 57.0, 45.0, 44.0, 38.0, 44.0, 44.0, 34.0, 32.0, 23.0, 17.0, 4.0, 10.0, 5.0, 6.0, 2.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00025653839111328125, -0.00024934113025665283, -0.00024214386940002441, -0.000234946608543396, -0.00022774934768676758, -0.00022055208683013916, -0.00021335482597351074, -0.00020615756511688232, -0.0001989603042602539, -0.0001917630434036255, -0.00018456578254699707, -0.00017736852169036865, -0.00017017126083374023, -0.00016297399997711182, -0.0001557767391204834, -0.00014857947826385498, -0.00014138221740722656, -0.00013418495655059814, -0.00012698769569396973, -0.00011979043483734131, -0.00011259317398071289, -0.00010539591312408447, -9.819865226745605e-05, -9.100139141082764e-05, -8.380413055419922e-05, -7.66068696975708e-05, -6.940960884094238e-05, -6.221234798431396e-05, -5.501508712768555e-05, -4.781782627105713e-05, -4.062056541442871e-05, -3.342330455780029e-05, -2.6226043701171875e-05, -1.9028782844543457e-05, -1.1831521987915039e-05, -4.634261131286621e-06, 2.562999725341797e-06, 9.760260581970215e-06, 1.6957521438598633e-05, 2.415478229522705e-05, 3.135204315185547e-05, 3.854930400848389e-05, 4.5746564865112305e-05, 5.294382572174072e-05, 6.014108657836914e-05, 6.733834743499756e-05, 7.453560829162598e-05, 8.17328691482544e-05, 8.893013000488281e-05, 9.612739086151123e-05, 0.00010332465171813965, 0.00011052191257476807, 0.00011771917343139648, 0.0001249164342880249, 0.00013211369514465332, 0.00013931095600128174, 0.00014650821685791016, 0.00015370547771453857, 0.000160902738571167, 0.0001680999994277954, 0.00017529726028442383, 0.00018249452114105225, 0.00018969178199768066, 0.00019688904285430908, 0.0002040863037109375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 7.0, 14.0, 18.0, 19.0, 36.0, 56.0, 56.0, 76.0, 97.0, 162.0, 245.0, 448.0, 727.0, 5406.0, 984683.0, 54058.0, 986.0, 477.0, 336.0, 191.0, 108.0, 93.0, 63.0, 41.0, 30.0, 17.0, 17.0, 15.0, 14.0, 8.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0036182403564453125, -0.003487497568130493, -0.003356754779815674, -0.0032260119915008545, -0.003095269203186035, -0.002964526414871216, -0.0028337836265563965, -0.002703040838241577, -0.002572298049926758, -0.0024415552616119385, -0.002310812473297119, -0.0021800696849823, -0.0020493268966674805, -0.0019185841083526611, -0.0017878413200378418, -0.0016570985317230225, -0.0015263557434082031, -0.0013956129550933838, -0.0012648701667785645, -0.0011341273784637451, -0.0010033845901489258, -0.0008726418018341064, -0.0007418990135192871, -0.0006111562252044678, -0.00048041343688964844, -0.0003496706485748291, -0.00021892786026000977, -8.818507194519043e-05, 4.2557716369628906e-05, 0.00017330050468444824, 0.0003040432929992676, 0.0004347860813140869, 0.0005655288696289062, 0.0006962716579437256, 0.0008270144462585449, 0.0009577572345733643, 0.0010885000228881836, 0.001219242811203003, 0.0013499855995178223, 0.0014807283878326416, 0.001611471176147461, 0.0017422139644622803, 0.0018729567527770996, 0.002003699541091919, 0.0021344423294067383, 0.0022651851177215576, 0.002395927906036377, 0.0025266706943511963, 0.0026574134826660156, 0.002788156270980835, 0.0029188990592956543, 0.0030496418476104736, 0.003180384635925293, 0.0033111274242401123, 0.0034418702125549316, 0.003572613000869751, 0.0037033557891845703, 0.0038340985774993896, 0.003964841365814209, 0.004095584154129028, 0.004226326942443848, 0.004357069730758667, 0.004487812519073486, 0.004618555307388306, 0.004749298095703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 16.0, 60.0, 96.0, 145.0, 174.0, 171.0, 154.0, 101.0, 49.0, 18.0, 10.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023732439149171114, -0.00022992145386524498, -0.00022251851623877883, -0.00021511557861231267, -0.00020771264098584652, -0.00020030970335938036, -0.0001929067657329142, -0.00018550382810644805, -0.0001781008904799819, -0.00017069795285351574, -0.0001632950152270496, -0.00015589207760058343, -0.00014848913997411728, -0.00014108620234765112, -0.00013368326472118497, -0.00012628032709471881, -0.00011887740402016789, -0.00011147446639370173, -0.00010407152876723558, -9.666859114076942e-05, -8.926565351430327e-05, -8.186271588783711e-05, -7.445978553732857e-05, -6.705684791086242e-05, -5.965391028439626e-05, -5.2250972657930106e-05, -4.484803503146395e-05, -3.74451010429766e-05, -3.0042163416510448e-05, -2.2639225790044293e-05, -1.5236291801556945e-05, -7.83335417509079e-06, -4.304311005398631e-07, 6.97250561643159e-06, 1.4375442333403043e-05, 2.1778378140879795e-05, 2.918131576734595e-05, 3.6584253393812105e-05, 4.398718738229945e-05, 5.139012500876561e-05, 5.879306263523176e-05, 6.619600026169792e-05, 7.359893788816407e-05, 8.100186823867261e-05, 8.840480586513877e-05, 9.580774349160492e-05, 0.00010321068111807108, 0.00011061361874453723, 0.00011801655637100339, 0.00012541949399746954, 0.0001328224316239357, 0.00014022536925040185, 0.000147628306876868, 0.00015503124450333416, 0.00016243418212980032, 0.00016983711975626647, 0.00017724005738273263, 0.00018464299500919878, 0.00019204593263566494, 0.0001994488702621311, 0.00020685180788859725, 0.0002142547455150634, 0.00022165768314152956, 0.00022906062076799572, 0.00023646354384254664]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 7.0, 15.0, 14.0, 18.0, 17.0, 25.0, 23.0, 18.0, 15.0, 24.0, 32.0, 28.0, 32.0, 44.0, 39.0, 42.0, 40.0, 40.0, 40.0, 42.0, 41.0, 35.0, 34.0, 38.0, 38.0, 21.0, 26.0, 27.0, 22.0, 24.0, 15.0, 14.0, 24.0, 12.0, 9.0, 12.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00011795759201049805, -0.0001145070418715477, -0.00011105649173259735, -0.000107605941593647, -0.00010415539145469666, -0.00010070484131574631, -9.725429117679596e-05, -9.380374103784561e-05, -9.035319089889526e-05, -8.690264075994492e-05, -8.345209062099457e-05, -8.000154048204422e-05, -7.655099034309387e-05, -7.310044020414352e-05, -6.964989006519318e-05, -6.619933992624283e-05, -6.274878978729248e-05, -5.929823964834213e-05, -5.5847689509391785e-05, -5.239713937044144e-05, -4.894658923149109e-05, -4.549603909254074e-05, -4.204548895359039e-05, -3.8594938814640045e-05, -3.51443886756897e-05, -3.169383853673935e-05, -2.8243288397789e-05, -2.4792738258838654e-05, -2.1342188119888306e-05, -1.7891637980937958e-05, -1.444108784198761e-05, -1.0990537703037262e-05, -7.539987564086914e-06, -4.089437425136566e-06, -6.388872861862183e-07, 2.8116628527641296e-06, 6.2622129917144775e-06, 9.712763130664825e-06, 1.3163313269615173e-05, 1.661386340856552e-05, 2.006441354751587e-05, 2.3514963686466217e-05, 2.6965513825416565e-05, 3.0416063964366913e-05, 3.386661410331726e-05, 3.731716424226761e-05, 4.0767714381217957e-05, 4.4218264520168304e-05, 4.766881465911865e-05, 5.1119364798069e-05, 5.456991493701935e-05, 5.8020465075969696e-05, 6.147101521492004e-05, 6.492156535387039e-05, 6.837211549282074e-05, 7.182266563177109e-05, 7.527321577072144e-05, 7.872376590967178e-05, 8.217431604862213e-05, 8.562486618757248e-05, 8.907541632652283e-05, 9.252596646547318e-05, 9.597651660442352e-05, 9.942706674337387e-05, 0.00010287761688232422]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 8.0, 5.0, 8.0, 15.0, 19.0, 21.0, 22.0, 33.0, 20.0, 27.0, 33.0, 26.0, 45.0, 44.0, 44.0, 38.0, 32.0, 44.0, 39.0, 38.0, 38.0, 40.0, 43.0, 31.0, 31.0, 38.0, 25.0, 23.0, 25.0, 8.0, 12.0, 16.0, 13.0, 13.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.6841278076171875, -1.626068115234375, -1.5680084228515625, -1.50994873046875, -1.4518890380859375, -1.393829345703125, -1.3357696533203125, -1.2777099609375, -1.2196502685546875, -1.161590576171875, -1.1035308837890625, -1.04547119140625, -0.9874114990234375, -0.929351806640625, -0.8712921142578125, -0.813232421875, -0.7551727294921875, -0.697113037109375, -0.6390533447265625, -0.58099365234375, -0.5229339599609375, -0.464874267578125, -0.4068145751953125, -0.3487548828125, -0.2906951904296875, -0.232635498046875, -0.1745758056640625, -0.11651611328125, -0.0584564208984375, -0.000396728515625, 0.0576629638671875, 0.11572265625, 0.1737823486328125, 0.231842041015625, 0.2899017333984375, 0.34796142578125, 0.4060211181640625, 0.464080810546875, 0.5221405029296875, 0.5802001953125, 0.6382598876953125, 0.696319580078125, 0.7543792724609375, 0.81243896484375, 0.8704986572265625, 0.928558349609375, 0.9866180419921875, 1.044677734375, 1.1027374267578125, 1.160797119140625, 1.2188568115234375, 1.27691650390625, 1.3349761962890625, 1.393035888671875, 1.4510955810546875, 1.5091552734375, 1.5672149658203125, 1.625274658203125, 1.6833343505859375, 1.74139404296875, 1.7994537353515625, 1.857513427734375, 1.9155731201171875, 1.9736328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 8.0, 4.0, 7.0, 4.0, 16.0, 13.0, 16.0, 21.0, 41.0, 59.0, 89.0, 108.0, 191.0, 292.0, 566.0, 854.0, 1601.0, 2894.0, 5706.0, 11125.0, 24271.0, 59467.0, 170982.0, 382467.0, 242565.0, 83470.0, 31876.0, 14371.0, 7031.0, 3684.0, 2058.0, 1082.0, 629.0, 342.0, 195.0, 119.0, 90.0, 80.0, 45.0, 33.0, 21.0, 20.0, 9.0, 12.0, 4.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-2.2265625, -2.15625, -2.0859375, -2.015625, -1.9453125, -1.875, -1.8046875, -1.734375, -1.6640625, -1.59375, -1.5234375, -1.453125, -1.3828125, -1.3125, -1.2421875, -1.171875, -1.1015625, -1.03125, -0.9609375, -0.890625, -0.8203125, -0.75, -0.6796875, -0.609375, -0.5390625, -0.46875, -0.3984375, -0.328125, -0.2578125, -0.1875, -0.1171875, -0.046875, 0.0234375, 0.09375, 0.1640625, 0.234375, 0.3046875, 0.375, 0.4453125, 0.515625, 0.5859375, 0.65625, 0.7265625, 0.796875, 0.8671875, 0.9375, 1.0078125, 1.078125, 1.1484375, 1.21875, 1.2890625, 1.359375, 1.4296875, 1.5, 1.5703125, 1.640625, 1.7109375, 1.78125, 1.8515625, 1.921875, 1.9921875, 2.0625, 2.1328125, 2.203125, 2.2734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 9.0, 10.0, 14.0, 17.0, 16.0, 25.0, 20.0, 35.0, 38.0, 34.0, 40.0, 62.0, 58.0, 68.0, 147.0, 324.0, 1398.0, 180.0, 88.0, 72.0, 55.0, 49.0, 29.0, 42.0, 31.0, 23.0, 31.0, 20.0, 18.0, 14.0, 13.0, 5.0, 8.0, 6.0, 5.0, 5.0, 6.0, 0.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44140625, -7.2021484375, -6.962890625, -6.7236328125, -6.484375, -6.2451171875, -6.005859375, -5.7666015625, -5.52734375, -5.2880859375, -5.048828125, -4.8095703125, -4.5703125, -4.3310546875, -4.091796875, -3.8525390625, -3.61328125, -3.3740234375, -3.134765625, -2.8955078125, -2.65625, -2.4169921875, -2.177734375, -1.9384765625, -1.69921875, -1.4599609375, -1.220703125, -0.9814453125, -0.7421875, -0.5029296875, -0.263671875, -0.0244140625, 0.21484375, 0.4541015625, 0.693359375, 0.9326171875, 1.171875, 1.4111328125, 1.650390625, 1.8896484375, 2.12890625, 2.3681640625, 2.607421875, 2.8466796875, 3.0859375, 3.3251953125, 3.564453125, 3.8037109375, 4.04296875, 4.2822265625, 4.521484375, 4.7607421875, 5.0, 5.2392578125, 5.478515625, 5.7177734375, 5.95703125, 6.1962890625, 6.435546875, 6.6748046875, 6.9140625, 7.1533203125, 7.392578125, 7.6318359375, 7.87109375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 2.0, 7.0, 17.0, 31.0, 39.0, 60.0, 108.0, 201.0, 422.0, 1783.0, 2646260.0, 494612.0, 1340.0, 364.0, 170.0, 105.0, 58.0, 37.0, 30.0, 12.0, 17.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-47.90625, -46.736083984375, -45.56591796875, -44.395751953125, -43.2255859375, -42.055419921875, -40.88525390625, -39.715087890625, -38.544921875, -37.374755859375, -36.20458984375, -35.034423828125, -33.8642578125, -32.694091796875, -31.52392578125, -30.353759765625, -29.18359375, -28.013427734375, -26.84326171875, -25.673095703125, -24.5029296875, -23.332763671875, -22.16259765625, -20.992431640625, -19.822265625, -18.652099609375, -17.48193359375, -16.311767578125, -15.1416015625, -13.971435546875, -12.80126953125, -11.631103515625, -10.4609375, -9.290771484375, -8.12060546875, -6.950439453125, -5.7802734375, -4.610107421875, -3.43994140625, -2.269775390625, -1.099609375, 0.070556640625, 1.24072265625, 2.410888671875, 3.5810546875, 4.751220703125, 5.92138671875, 7.091552734375, 8.26171875, 9.431884765625, 10.60205078125, 11.772216796875, 12.9423828125, 14.112548828125, 15.28271484375, 16.452880859375, 17.623046875, 18.793212890625, 19.96337890625, 21.133544921875, 22.3037109375, 23.473876953125, 24.64404296875, 25.814208984375, 26.984375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [796.0, 218.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.200349807739258, 0.8117284774780273, 5.8238067626953125, 10.835885047912598, 15.847963333129883, 20.86004066467285, 25.872119903564453, 30.884199142456055, 35.896278381347656, 40.908355712890625, 45.920433044433594, 50.93251419067383, 55.9445915222168, 60.956668853759766, 65.96875, 70.98082733154297, 75.99290466308594, 81.0049819946289, 86.01705932617188, 91.02913665771484, 96.04121398925781, 101.05329895019531, 106.06537628173828, 111.07745361328125, 116.08953094482422, 121.10160827636719, 126.11368560791016, 131.12576293945312, 136.13784790039062, 141.14991760253906, 146.16200256347656, 151.174072265625, 156.1861572265625, 161.1982421875, 166.21031188964844, 171.22239685058594, 176.23446655273438, 181.24655151367188, 186.2586212158203, 191.2707061767578, 196.28277587890625, 201.29486083984375, 206.3069305419922, 211.3190155029297, 216.33108520507812, 221.34317016601562, 226.35523986816406, 231.36732482910156, 236.37940979003906, 241.39149475097656, 246.403564453125, 251.4156494140625, 256.427734375, 261.4397888183594, 266.4518737792969, 271.4639587402344, 276.4760437011719, 281.4881286621094, 286.5002136230469, 291.51226806640625, 296.52435302734375, 301.53643798828125, 306.54852294921875, 311.56060791015625, 316.5726623535156]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 2.0, 4.0, 13.0, 11.0, 13.0, 18.0, 11.0, 15.0, 22.0, 25.0, 28.0, 22.0, 36.0, 37.0, 30.0, 39.0, 29.0, 39.0, 41.0, 39.0, 37.0, 35.0, 36.0, 33.0, 43.0, 38.0, 30.0, 34.0, 31.0, 24.0, 22.0, 24.0, 18.0, 17.0, 14.0, 12.0, 14.0, 12.0, 2.0, 11.0, 9.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.929765701293945, -18.370332717895508, -17.81089973449707, -17.25146484375, -16.692031860351562, -16.132598876953125, -15.573165893554688, -15.01373291015625, -14.454298973083496, -13.894865989685059, -13.335432052612305, -12.775999069213867, -12.21656608581543, -11.657132148742676, -11.097699165344238, -10.538265228271484, -9.978832244873047, -9.41939926147461, -8.859965324401855, -8.300532341003418, -7.741098880767822, -7.181665420532227, -6.622232437133789, -6.062798976898193, -5.503365516662598, -4.943932056427002, -4.384498596191406, -3.8250656127929688, -3.265632152557373, -2.7061986923217773, -2.1467654705047607, -1.5873322486877441, -1.0278987884521484, -0.4684654474258423, 0.09096789360046387, 0.65040123462677, 1.2098345756530762, 1.7692680358886719, 2.3287012577056885, 2.888134479522705, 3.447567939758301, 4.0070013999938965, 4.566434860229492, 5.12586784362793, 5.685301303863525, 6.244734764099121, 6.804167747497559, 7.363601207733154, 7.92303466796875, 8.482467651367188, 9.041901588439941, 9.601334571838379, 10.160768508911133, 10.72020149230957, 11.279634475708008, 11.839067459106445, 12.3985013961792, 12.957934379577637, 13.51736831665039, 14.076801300048828, 14.636234283447266, 15.19566822052002, 15.755101203918457, 16.31453514099121, 16.87396812438965]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 13.0, 11.0, 13.0, 14.0, 20.0, 12.0, 31.0, 16.0, 26.0, 24.0, 29.0, 28.0, 34.0, 45.0, 35.0, 38.0, 30.0, 37.0, 39.0, 46.0, 32.0, 36.0, 48.0, 38.0, 34.0, 32.0, 27.0, 34.0, 18.0, 20.0, 19.0, 18.0, 8.0, 12.0, 13.0, 9.0, 4.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8095703125, -1.7487945556640625, -1.688018798828125, -1.6272430419921875, -1.56646728515625, -1.5056915283203125, -1.444915771484375, -1.3841400146484375, -1.3233642578125, -1.2625885009765625, -1.201812744140625, -1.1410369873046875, -1.08026123046875, -1.0194854736328125, -0.958709716796875, -0.8979339599609375, -0.837158203125, -0.7763824462890625, -0.715606689453125, -0.6548309326171875, -0.59405517578125, -0.5332794189453125, -0.472503662109375, -0.4117279052734375, -0.3509521484375, -0.2901763916015625, -0.229400634765625, -0.1686248779296875, -0.10784912109375, -0.0470733642578125, 0.013702392578125, 0.0744781494140625, 0.13525390625, 0.1960296630859375, 0.256805419921875, 0.3175811767578125, 0.37835693359375, 0.4391326904296875, 0.499908447265625, 0.5606842041015625, 0.6214599609375, 0.6822357177734375, 0.743011474609375, 0.8037872314453125, 0.86456298828125, 0.9253387451171875, 0.986114501953125, 1.0468902587890625, 1.107666015625, 1.1684417724609375, 1.229217529296875, 1.2899932861328125, 1.35076904296875, 1.4115447998046875, 1.472320556640625, 1.5330963134765625, 1.5938720703125, 1.6546478271484375, 1.715423583984375, 1.7761993408203125, 1.83697509765625, 1.8977508544921875, 1.958526611328125, 2.0193023681640625, 2.080078125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 0.0, 4.0, 15.0, 13.0, 13.0, 9.0, 17.0, 15.0, 18.0, 27.0, 40.0, 36.0, 47.0, 63.0, 84.0, 77.0, 112.0, 202.0, 393.0, 1331.0, 15589.0, 944079.0, 3130760.0, 96166.0, 3589.0, 620.0, 260.0, 145.0, 106.0, 96.0, 59.0, 54.0, 43.0, 30.0, 29.0, 16.0, 19.0, 23.0, 21.0, 13.0, 9.0, 10.0, 5.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.29443359375, -8.0107421875, -7.72705078125, -7.443359375, -7.15966796875, -6.8759765625, -6.59228515625, -6.30859375, -6.02490234375, -5.7412109375, -5.45751953125, -5.173828125, -4.89013671875, -4.6064453125, -4.32275390625, -4.0390625, -3.75537109375, -3.4716796875, -3.18798828125, -2.904296875, -2.62060546875, -2.3369140625, -2.05322265625, -1.76953125, -1.48583984375, -1.2021484375, -0.91845703125, -0.634765625, -0.35107421875, -0.0673828125, 0.21630859375, 0.5, 0.78369140625, 1.0673828125, 1.35107421875, 1.634765625, 1.91845703125, 2.2021484375, 2.48583984375, 2.76953125, 3.05322265625, 3.3369140625, 3.62060546875, 3.904296875, 4.18798828125, 4.4716796875, 4.75537109375, 5.0390625, 5.32275390625, 5.6064453125, 5.89013671875, 6.173828125, 6.45751953125, 6.7412109375, 7.02490234375, 7.30859375, 7.59228515625, 7.8759765625, 8.15966796875, 8.443359375, 8.72705078125, 9.0107421875, 9.29443359375, 9.578125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 9.0, 19.0, 26.0, 28.0, 45.0, 56.0, 88.0, 122.0, 178.0, 239.0, 341.0, 414.0, 480.0, 468.0, 407.0, 320.0, 231.0, 172.0, 137.0, 84.0, 61.0, 39.0, 35.0, 15.0, 15.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.84375, -5.67138671875, -5.4990234375, -5.32666015625, -5.154296875, -4.98193359375, -4.8095703125, -4.63720703125, -4.46484375, -4.29248046875, -4.1201171875, -3.94775390625, -3.775390625, -3.60302734375, -3.4306640625, -3.25830078125, -3.0859375, -2.91357421875, -2.7412109375, -2.56884765625, -2.396484375, -2.22412109375, -2.0517578125, -1.87939453125, -1.70703125, -1.53466796875, -1.3623046875, -1.18994140625, -1.017578125, -0.84521484375, -0.6728515625, -0.50048828125, -0.328125, -0.15576171875, 0.0166015625, 0.18896484375, 0.361328125, 0.53369140625, 0.7060546875, 0.87841796875, 1.05078125, 1.22314453125, 1.3955078125, 1.56787109375, 1.740234375, 1.91259765625, 2.0849609375, 2.25732421875, 2.4296875, 2.60205078125, 2.7744140625, 2.94677734375, 3.119140625, 3.29150390625, 3.4638671875, 3.63623046875, 3.80859375, 3.98095703125, 4.1533203125, 4.32568359375, 4.498046875, 4.67041015625, 4.8427734375, 5.01513671875, 5.1875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 17.0, 12.0, 23.0, 34.0, 56.0, 76.0, 96.0, 115.0, 206.0, 277.0, 506.0, 1288.0, 9381.0, 457966.0, 3587997.0, 129679.0, 4420.0, 909.0, 412.0, 247.0, 154.0, 97.0, 83.0, 63.0, 53.0, 32.0, 23.0, 12.0, 10.0, 15.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.78125, -13.3272705078125, -12.873291015625, -12.4193115234375, -11.96533203125, -11.5113525390625, -11.057373046875, -10.6033935546875, -10.1494140625, -9.6954345703125, -9.241455078125, -8.7874755859375, -8.33349609375, -7.8795166015625, -7.425537109375, -6.9715576171875, -6.517578125, -6.0635986328125, -5.609619140625, -5.1556396484375, -4.70166015625, -4.2476806640625, -3.793701171875, -3.3397216796875, -2.8857421875, -2.4317626953125, -1.977783203125, -1.5238037109375, -1.06982421875, -0.6158447265625, -0.161865234375, 0.2921142578125, 0.74609375, 1.2000732421875, 1.654052734375, 2.1080322265625, 2.56201171875, 3.0159912109375, 3.469970703125, 3.9239501953125, 4.3779296875, 4.8319091796875, 5.285888671875, 5.7398681640625, 6.19384765625, 6.6478271484375, 7.101806640625, 7.5557861328125, 8.009765625, 8.4637451171875, 8.917724609375, 9.3717041015625, 9.82568359375, 10.2796630859375, 10.733642578125, 11.1876220703125, 11.6416015625, 12.0955810546875, 12.549560546875, 13.0035400390625, 13.45751953125, 13.9114990234375, 14.365478515625, 14.8194580078125, 15.2734375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 74.0, 564.0, 351.0, 24.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.5766143798828, -202.94308471679688, -198.30955505371094, -193.676025390625, -189.04251098632812, -184.4089813232422, -179.77545166015625, -175.1419219970703, -170.50839233398438, -165.87486267089844, -161.2413330078125, -156.60780334472656, -151.97427368164062, -147.34075927734375, -142.7072296142578, -138.07369995117188, -133.44017028808594, -128.806640625, -124.17311096191406, -119.53958892822266, -114.90605926513672, -110.27252960205078, -105.63900756835938, -101.00547790527344, -96.3719482421875, -91.73841857910156, -87.10488891601562, -82.47136688232422, -77.83783721923828, -73.20430755615234, -68.57078552246094, -63.937255859375, -59.30372619628906, -54.670196533203125, -50.03667068481445, -45.40314483642578, -40.769615173339844, -36.136085510253906, -31.502559661865234, -26.869033813476562, -22.235504150390625, -17.60197639465332, -12.968448638916016, -8.334920883178711, -3.7013931274414062, 0.9321346282958984, 5.565662384033203, 10.199188232421875, 14.832717895507812, 19.466245651245117, 24.099773406982422, 28.733301162719727, 33.36682891845703, 38.00035858154297, 42.63388442993164, 47.26741027832031, 51.90093994140625, 56.53446960449219, 61.16799545288086, 65.80152130126953, 70.43505096435547, 75.0685806274414, 79.70210266113281, 84.33563232421875, 88.96916198730469]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 12.0, 5.0, 8.0, 13.0, 17.0, 17.0, 11.0, 15.0, 16.0, 23.0, 28.0, 20.0, 26.0, 24.0, 38.0, 32.0, 40.0, 41.0, 45.0, 46.0, 43.0, 37.0, 38.0, 38.0, 38.0, 38.0, 42.0, 26.0, 27.0, 25.0, 22.0, 18.0, 27.0, 15.0, 11.0, 17.0, 12.0, 8.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.296612739562988, -13.795836448669434, -13.295059204101562, -12.794282913208008, -12.293505668640137, -11.792729377746582, -11.291952133178711, -10.791175842285156, -10.290399551391602, -9.789623260498047, -9.288846015930176, -8.788069725036621, -8.28729248046875, -7.786516189575195, -7.285739421844482, -6.7849626541137695, -6.284185409545898, -5.7834086418151855, -5.282631874084473, -4.781855583190918, -4.281078338623047, -3.780301809310913, -3.2795252799987793, -2.7787485122680664, -2.2779717445373535, -1.7771949768066406, -1.2764183282852173, -0.775641679763794, -0.27486491203308105, 0.22591185569763184, 0.7266883850097656, 1.2274651527404785, 1.7282428741455078, 2.2290196418762207, 2.7297964096069336, 3.2305729389190674, 3.7313497066497803, 4.232126235961914, 4.732903003692627, 5.23367977142334, 5.734456539154053, 6.235233306884766, 6.7360100746154785, 7.236786842346191, 7.737563133239746, 8.238340377807617, 8.739116668701172, 9.239892959594727, 9.740670204162598, 10.241446495056152, 10.742223739624023, 11.243000030517578, 11.74377727508545, 12.244553565979004, 12.745330810546875, 13.24610710144043, 13.746883392333984, 14.247659683227539, 14.74843692779541, 15.249213218688965, 15.749990463256836, 16.25076675415039, 16.751543045043945, 17.2523193359375, 17.753097534179688]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 11.0, 10.0, 6.0, 5.0, 16.0, 13.0, 16.0, 17.0, 19.0, 24.0, 20.0, 24.0, 34.0, 32.0, 37.0, 44.0, 30.0, 29.0, 40.0, 53.0, 49.0, 33.0, 31.0, 62.0, 40.0, 31.0, 32.0, 34.0, 34.0, 19.0, 24.0, 21.0, 19.0, 16.0, 13.0, 11.0, 7.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.821563720703125, -1.75640869140625, -1.691253662109375, -1.6260986328125, -1.560943603515625, -1.49578857421875, -1.430633544921875, -1.365478515625, -1.300323486328125, -1.23516845703125, -1.170013427734375, -1.1048583984375, -1.039703369140625, -0.97454833984375, -0.909393310546875, -0.84423828125, -0.779083251953125, -0.71392822265625, -0.648773193359375, -0.5836181640625, -0.518463134765625, -0.45330810546875, -0.388153076171875, -0.322998046875, -0.257843017578125, -0.19268798828125, -0.127532958984375, -0.0623779296875, 0.002777099609375, 0.06793212890625, 0.133087158203125, 0.1982421875, 0.263397216796875, 0.32855224609375, 0.393707275390625, 0.4588623046875, 0.524017333984375, 0.58917236328125, 0.654327392578125, 0.719482421875, 0.784637451171875, 0.84979248046875, 0.914947509765625, 0.9801025390625, 1.045257568359375, 1.11041259765625, 1.175567626953125, 1.24072265625, 1.305877685546875, 1.37103271484375, 1.436187744140625, 1.5013427734375, 1.566497802734375, 1.63165283203125, 1.696807861328125, 1.761962890625, 1.827117919921875, 1.89227294921875, 1.957427978515625, 2.0225830078125, 2.087738037109375, 2.15289306640625, 2.218048095703125, 2.283203125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 28.0, 40.0, 51.0, 109.0, 144.0, 200.0, 320.0, 452.0, 694.0, 942.0, 1425.0, 2012.0, 3074.0, 4442.0, 6586.0, 10091.0, 15605.0, 24442.0, 40073.0, 69895.0, 134757.0, 296781.0, 199650.0, 95370.0, 52828.0, 31236.0, 19591.0, 12445.0, 8223.0, 5515.0, 3688.0, 2412.0, 1752.0, 1139.0, 781.0, 555.0, 342.0, 281.0, 172.0, 112.0, 86.0, 64.0, 33.0, 28.0, 11.0, 11.0, 9.0, 8.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.41845703125, -0.40605926513671875, -0.3936614990234375, -0.38126373291015625, -0.368865966796875, -0.35646820068359375, -0.3440704345703125, -0.33167266845703125, -0.31927490234375, -0.30687713623046875, -0.2944793701171875, -0.28208160400390625, -0.269683837890625, -0.25728607177734375, -0.2448883056640625, -0.23249053955078125, -0.2200927734375, -0.20769500732421875, -0.1952972412109375, -0.18289947509765625, -0.170501708984375, -0.15810394287109375, -0.1457061767578125, -0.13330841064453125, -0.12091064453125, -0.10851287841796875, -0.0961151123046875, -0.08371734619140625, -0.071319580078125, -0.05892181396484375, -0.0465240478515625, -0.03412628173828125, -0.021728515625, -0.00933074951171875, 0.0030670166015625, 0.01546478271484375, 0.027862548828125, 0.04026031494140625, 0.0526580810546875, 0.06505584716796875, 0.07745361328125, 0.08985137939453125, 0.1022491455078125, 0.11464691162109375, 0.127044677734375, 0.13944244384765625, 0.1518402099609375, 0.16423797607421875, 0.1766357421875, 0.18903350830078125, 0.2014312744140625, 0.21382904052734375, 0.226226806640625, 0.23862457275390625, 0.2510223388671875, 0.26342010498046875, 0.27581787109375, 0.28821563720703125, 0.3006134033203125, 0.31301116943359375, 0.325408935546875, 0.33780670166015625, 0.3502044677734375, 0.36260223388671875, 0.375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 4.0, 17.0, 13.0, 17.0, 16.0, 15.0, 16.0, 24.0, 43.0, 33.0, 30.0, 30.0, 37.0, 31.0, 43.0, 45.0, 39.0, 1064.0, 31.0, 45.0, 33.0, 38.0, 57.0, 27.0, 40.0, 30.0, 31.0, 27.0, 20.0, 24.0, 14.0, 11.0, 21.0, 6.0, 7.0, 6.0, 11.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2742919921875, -1.230224609375, -1.1861572265625, -1.14208984375, -1.0980224609375, -1.053955078125, -1.0098876953125, -0.9658203125, -0.9217529296875, -0.877685546875, -0.8336181640625, -0.78955078125, -0.7454833984375, -0.701416015625, -0.6573486328125, -0.61328125, -0.5692138671875, -0.525146484375, -0.4810791015625, -0.43701171875, -0.3929443359375, -0.348876953125, -0.3048095703125, -0.2607421875, -0.2166748046875, -0.172607421875, -0.1285400390625, -0.08447265625, -0.0404052734375, 0.003662109375, 0.0477294921875, 0.091796875, 0.1358642578125, 0.179931640625, 0.2239990234375, 0.26806640625, 0.3121337890625, 0.356201171875, 0.4002685546875, 0.4443359375, 0.4884033203125, 0.532470703125, 0.5765380859375, 0.62060546875, 0.6646728515625, 0.708740234375, 0.7528076171875, 0.796875, 0.8409423828125, 0.885009765625, 0.9290771484375, 0.97314453125, 1.0172119140625, 1.061279296875, 1.1053466796875, 1.1494140625, 1.1934814453125, 1.237548828125, 1.2816162109375, 1.32568359375, 1.3697509765625, 1.413818359375, 1.4578857421875, 1.501953125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 14.0, 19.0, 26.0, 32.0, 55.0, 75.0, 117.0, 163.0, 267.0, 330.0, 553.0, 757.0, 1044.0, 1630.0, 2485.0, 3699.0, 5658.0, 8495.0, 13580.0, 21556.0, 35388.0, 60776.0, 109978.0, 229462.0, 1309848.0, 120548.0, 66201.0, 38956.0, 23437.0, 14610.0, 9330.0, 5975.0, 3916.0, 2671.0, 1770.0, 1231.0, 813.0, 520.0, 361.0, 255.0, 164.0, 117.0, 82.0, 60.0, 33.0, 28.0, 12.0, 11.0, 11.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3490791320800781, -0.33707427978515625, -0.3250694274902344, -0.3130645751953125, -0.3010597229003906, -0.28905487060546875, -0.2770500183105469, -0.265045166015625, -0.2530403137207031, -0.24103546142578125, -0.22903060913085938, -0.2170257568359375, -0.20502090454101562, -0.19301605224609375, -0.18101119995117188, -0.16900634765625, -0.15700149536132812, -0.14499664306640625, -0.13299179077148438, -0.1209869384765625, -0.10898208618164062, -0.09697723388671875, -0.08497238159179688, -0.072967529296875, -0.060962677001953125, -0.04895782470703125, -0.036952972412109375, -0.0249481201171875, -0.012943267822265625, -0.00093841552734375, 0.011066436767578125, 0.0230712890625, 0.035076141357421875, 0.04708099365234375, 0.059085845947265625, 0.0710906982421875, 0.08309555053710938, 0.09510040283203125, 0.10710525512695312, 0.119110107421875, 0.13111495971679688, 0.14311981201171875, 0.15512466430664062, 0.1671295166015625, 0.17913436889648438, 0.19113922119140625, 0.20314407348632812, 0.21514892578125, 0.22715377807617188, 0.23915863037109375, 0.2511634826660156, 0.2631683349609375, 0.2751731872558594, 0.28717803955078125, 0.2991828918457031, 0.311187744140625, 0.3231925964355469, 0.33519744873046875, 0.3472023010253906, 0.3592071533203125, 0.3712120056152344, 0.38321685791015625, 0.3952217102050781, 0.4072265625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 6.0, 7.0, 15.0, 21.0, 23.0, 24.0, 23.0, 21.0, 30.0, 39.0, 45.0, 46.0, 49.0, 56.0, 55.0, 71.0, 44.0, 59.0, 42.0, 36.0, 42.0, 33.0, 30.0, 22.0, 25.0, 21.0, 16.0, 15.0, 14.0, 7.0, 8.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.00023508071899414062, -0.00022794120013713837, -0.0002208016812801361, -0.00021366216242313385, -0.0002065226435661316, -0.00019938312470912933, -0.00019224360585212708, -0.00018510408699512482, -0.00017796456813812256, -0.0001708250492811203, -0.00016368553042411804, -0.00015654601156711578, -0.00014940649271011353, -0.00014226697385311127, -0.000135127454996109, -0.00012798793613910675, -0.00012084841728210449, -0.00011370889842510223, -0.00010656937956809998, -9.942986071109772e-05, -9.229034185409546e-05, -8.51508229970932e-05, -7.801130414009094e-05, -7.087178528308868e-05, -6.373226642608643e-05, -5.659274756908417e-05, -4.945322871208191e-05, -4.231370985507965e-05, -3.517419099807739e-05, -2.8034672141075134e-05, -2.0895153284072876e-05, -1.3755634427070618e-05, -6.616115570068359e-06, 5.234032869338989e-07, 7.662922143936157e-06, 1.4802441000938416e-05, 2.1941959857940674e-05, 2.9081478714942932e-05, 3.622099757194519e-05, 4.336051642894745e-05, 5.050003528594971e-05, 5.7639554142951965e-05, 6.477907299995422e-05, 7.191859185695648e-05, 7.905811071395874e-05, 8.6197629570961e-05, 9.333714842796326e-05, 0.00010047666728496552, 0.00010761618614196777, 0.00011475570499897003, 0.00012189522385597229, 0.00012903474271297455, 0.0001361742615699768, 0.00014331378042697906, 0.00015045329928398132, 0.00015759281814098358, 0.00016473233699798584, 0.0001718718558549881, 0.00017901137471199036, 0.00018615089356899261, 0.00019329041242599487, 0.00020042993128299713, 0.0002075694501399994, 0.00021470896899700165, 0.0002218484878540039]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 7.0, 16.0, 12.0, 25.0, 19.0, 28.0, 41.0, 52.0, 81.0, 99.0, 133.0, 224.0, 350.0, 603.0, 1453.0, 307681.0, 733709.0, 2137.0, 673.0, 385.0, 247.0, 172.0, 106.0, 68.0, 57.0, 46.0, 35.0, 22.0, 13.0, 10.0, 11.0, 12.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004329681396484375, -0.004185795783996582, -0.004041910171508789, -0.003898024559020996, -0.003754138946533203, -0.00361025333404541, -0.003466367721557617, -0.0033224821090698242, -0.0031785964965820312, -0.0030347108840942383, -0.0028908252716064453, -0.0027469396591186523, -0.0026030540466308594, -0.0024591684341430664, -0.0023152828216552734, -0.0021713972091674805, -0.0020275115966796875, -0.0018836259841918945, -0.0017397403717041016, -0.0015958547592163086, -0.0014519691467285156, -0.0013080835342407227, -0.0011641979217529297, -0.0010203123092651367, -0.0008764266967773438, -0.0007325410842895508, -0.0005886554718017578, -0.00044476985931396484, -0.0003008842468261719, -0.0001569986343383789, -1.3113021850585938e-05, 0.00013077259063720703, 0.000274658203125, 0.00041854381561279297, 0.0005624294281005859, 0.0007063150405883789, 0.0008502006530761719, 0.0009940862655639648, 0.0011379718780517578, 0.0012818574905395508, 0.0014257431030273438, 0.0015696287155151367, 0.0017135143280029297, 0.0018573999404907227, 0.0020012855529785156, 0.0021451711654663086, 0.0022890567779541016, 0.0024329423904418945, 0.0025768280029296875, 0.0027207136154174805, 0.0028645992279052734, 0.0030084848403930664, 0.0031523704528808594, 0.0032962560653686523, 0.0034401416778564453, 0.0035840272903442383, 0.0037279129028320312, 0.0038717985153198242, 0.004015684127807617, 0.00415956974029541, 0.004303455352783203, 0.004447340965270996, 0.004591226577758789, 0.004735112190246582, 0.004878997802734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 29.0, 69.0, 129.0, 166.0, 217.0, 169.0, 114.0, 68.0, 24.0, 14.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002702518249861896, -0.00026107270969077945, -0.0002518935943953693, -0.00024271449365187436, -0.00023353539290837944, -0.00022435627761296928, -0.00021517716231755912, -0.00020599804702214897, -0.00019681894627865404, -0.00018763983098324388, -0.00017846073023974895, -0.0001692816149443388, -0.00016010249964892864, -0.00015092339890543371, -0.00014174428361002356, -0.00013256518286652863, -0.00012338606757111847, -0.00011420695955166593, -0.00010502785153221339, -9.584873623680323e-05, -8.666962821735069e-05, -7.749052019789815e-05, -6.8311404902488e-05, -5.913229688303545e-05, -4.995318886358291e-05, -4.077408084413037e-05, -3.159496918669902e-05, -2.2415859348257072e-05, -1.3236749509815127e-05, -4.057641490362585e-06, 5.1214701670687646e-06, 1.4300581824500114e-05, 2.3479689843952656e-05, 3.26587978634052e-05, 4.183790952083655e-05, 5.1017021178267896e-05, 6.019612919772044e-05, 6.937523721717298e-05, 7.855435251258314e-05, 8.773346053203568e-05, 9.691256855148822e-05, 0.00010609167657094076, 0.0001152707845903933, 0.00012444989988580346, 0.00013362901518121362, 0.00014280811592470855, 0.0001519872312201187, 0.00016116633196361363, 0.00017034544725902379, 0.00017952456255443394, 0.00018870366329792887, 0.00019788277859333903, 0.00020706187933683395, 0.0002162409946322441, 0.00022542010992765427, 0.00023459922522306442, 0.00024377832596655935, 0.0002529574267100543, 0.00026213654200546443, 0.0002713156573008746, 0.00028049477259628475, 0.00028967385878786445, 0.0002988529740832746, 0.00030803208937868476, 0.0003172112046740949]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 8.0, 3.0, 4.0, 13.0, 5.0, 7.0, 14.0, 21.0, 26.0, 8.0, 19.0, 20.0, 27.0, 19.0, 32.0, 21.0, 28.0, 21.0, 37.0, 42.0, 34.0, 35.0, 39.0, 40.0, 35.0, 32.0, 32.0, 42.0, 37.0, 34.0, 22.0, 27.0, 27.0, 10.0, 23.0, 21.0, 19.0, 21.0, 15.0, 8.0, 11.0, 15.0, 11.0, 4.0, 3.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011897087097167969, -0.0001154458150267601, -0.00011192075908184052, -0.00010839570313692093, -0.00010487064719200134, -0.00010134559124708176, -9.782053530216217e-05, -9.429547935724258e-05, -9.0770423412323e-05, -8.724536746740341e-05, -8.372031152248383e-05, -8.019525557756424e-05, -7.667019963264465e-05, -7.314514368772507e-05, -6.962008774280548e-05, -6.60950317978859e-05, -6.256997585296631e-05, -5.904491990804672e-05, -5.5519863963127136e-05, -5.199480801820755e-05, -4.8469752073287964e-05, -4.494469612836838e-05, -4.141964018344879e-05, -3.7894584238529205e-05, -3.436952829360962e-05, -3.084447234869003e-05, -2.7319416403770447e-05, -2.379436045885086e-05, -2.0269304513931274e-05, -1.6744248569011688e-05, -1.3219192624092102e-05, -9.694136679172516e-06, -6.16908073425293e-06, -2.6440247893333435e-06, 8.810311555862427e-07, 4.406087100505829e-06, 7.931143045425415e-06, 1.1456198990345001e-05, 1.4981254935264587e-05, 1.8506310880184174e-05, 2.203136682510376e-05, 2.5556422770023346e-05, 2.9081478714942932e-05, 3.260653465986252e-05, 3.6131590604782104e-05, 3.965664654970169e-05, 4.318170249462128e-05, 4.670675843954086e-05, 5.023181438446045e-05, 5.3756870329380035e-05, 5.728192627429962e-05, 6.080698221921921e-05, 6.43320381641388e-05, 6.785709410905838e-05, 7.138215005397797e-05, 7.490720599889755e-05, 7.843226194381714e-05, 8.195731788873672e-05, 8.548237383365631e-05, 8.90074297785759e-05, 9.253248572349548e-05, 9.605754166841507e-05, 9.958259761333466e-05, 0.00010310765355825424, 0.00010663270950317383]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 11.0, 10.0, 6.0, 5.0, 16.0, 13.0, 16.0, 17.0, 19.0, 24.0, 20.0, 24.0, 34.0, 32.0, 37.0, 44.0, 30.0, 29.0, 40.0, 53.0, 49.0, 33.0, 31.0, 62.0, 40.0, 31.0, 32.0, 34.0, 34.0, 19.0, 24.0, 21.0, 19.0, 16.0, 13.0, 11.0, 7.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.821563720703125, -1.75640869140625, -1.691253662109375, -1.6260986328125, -1.560943603515625, -1.49578857421875, -1.430633544921875, -1.365478515625, -1.300323486328125, -1.23516845703125, -1.170013427734375, -1.1048583984375, -1.039703369140625, -0.97454833984375, -0.909393310546875, -0.84423828125, -0.779083251953125, -0.71392822265625, -0.648773193359375, -0.5836181640625, -0.518463134765625, -0.45330810546875, -0.388153076171875, -0.322998046875, -0.257843017578125, -0.19268798828125, -0.127532958984375, -0.0623779296875, 0.002777099609375, 0.06793212890625, 0.133087158203125, 0.1982421875, 0.263397216796875, 0.32855224609375, 0.393707275390625, 0.4588623046875, 0.524017333984375, 0.58917236328125, 0.654327392578125, 0.719482421875, 0.784637451171875, 0.84979248046875, 0.914947509765625, 0.9801025390625, 1.045257568359375, 1.11041259765625, 1.175567626953125, 1.24072265625, 1.305877685546875, 1.37103271484375, 1.436187744140625, 1.5013427734375, 1.566497802734375, 1.63165283203125, 1.696807861328125, 1.761962890625, 1.827117919921875, 1.89227294921875, 1.957427978515625, 2.0225830078125, 2.087738037109375, 2.15289306640625, 2.218048095703125, 2.283203125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 6.0, 16.0, 12.0, 12.0, 19.0, 32.0, 58.0, 77.0, 110.0, 184.0, 276.0, 443.0, 773.0, 1291.0, 2583.0, 4604.0, 8163.0, 14784.0, 26778.0, 48868.0, 97813.0, 218782.0, 302176.0, 160426.0, 73923.0, 38330.0, 21185.0, 11916.0, 6485.0, 3614.0, 1970.0, 1077.0, 633.0, 382.0, 229.0, 151.0, 112.0, 64.0, 45.0, 36.0, 28.0, 15.0, 17.0, 14.0, 4.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.7490234375, -1.69488525390625, -1.6407470703125, -1.58660888671875, -1.532470703125, -1.47833251953125, -1.4241943359375, -1.37005615234375, -1.31591796875, -1.26177978515625, -1.2076416015625, -1.15350341796875, -1.099365234375, -1.04522705078125, -0.9910888671875, -0.93695068359375, -0.8828125, -0.82867431640625, -0.7745361328125, -0.72039794921875, -0.666259765625, -0.61212158203125, -0.5579833984375, -0.50384521484375, -0.44970703125, -0.39556884765625, -0.3414306640625, -0.28729248046875, -0.233154296875, -0.17901611328125, -0.1248779296875, -0.07073974609375, -0.0166015625, 0.03753662109375, 0.0916748046875, 0.14581298828125, 0.199951171875, 0.25408935546875, 0.3082275390625, 0.36236572265625, 0.41650390625, 0.47064208984375, 0.5247802734375, 0.57891845703125, 0.633056640625, 0.68719482421875, 0.7413330078125, 0.79547119140625, 0.849609375, 0.90374755859375, 0.9578857421875, 1.01202392578125, 1.066162109375, 1.12030029296875, 1.1744384765625, 1.22857666015625, 1.28271484375, 1.33685302734375, 1.3909912109375, 1.44512939453125, 1.499267578125, 1.55340576171875, 1.6075439453125, 1.66168212890625, 1.7158203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 9.0, 6.0, 7.0, 15.0, 16.0, 13.0, 19.0, 19.0, 24.0, 22.0, 32.0, 41.0, 39.0, 35.0, 41.0, 55.0, 65.0, 147.0, 363.0, 1406.0, 174.0, 69.0, 52.0, 48.0, 38.0, 41.0, 39.0, 26.0, 26.0, 21.0, 22.0, 20.0, 16.0, 13.0, 11.0, 8.0, 9.0, 9.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.7578125, -8.50787353515625, -8.2579345703125, -8.00799560546875, -7.758056640625, -7.50811767578125, -7.2581787109375, -7.00823974609375, -6.75830078125, -6.50836181640625, -6.2584228515625, -6.00848388671875, -5.758544921875, -5.50860595703125, -5.2586669921875, -5.00872802734375, -4.7587890625, -4.50885009765625, -4.2589111328125, -4.00897216796875, -3.759033203125, -3.50909423828125, -3.2591552734375, -3.00921630859375, -2.75927734375, -2.50933837890625, -2.2593994140625, -2.00946044921875, -1.759521484375, -1.50958251953125, -1.2596435546875, -1.00970458984375, -0.759765625, -0.50982666015625, -0.2598876953125, -0.00994873046875, 0.239990234375, 0.48992919921875, 0.7398681640625, 0.98980712890625, 1.23974609375, 1.48968505859375, 1.7396240234375, 1.98956298828125, 2.239501953125, 2.48944091796875, 2.7393798828125, 2.98931884765625, 3.2392578125, 3.48919677734375, 3.7391357421875, 3.98907470703125, 4.239013671875, 4.48895263671875, 4.7388916015625, 4.98883056640625, 5.23876953125, 5.48870849609375, 5.7386474609375, 5.98858642578125, 6.238525390625, 6.48846435546875, 6.7384033203125, 6.98834228515625, 7.23828125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 8.0, 10.0, 5.0, 13.0, 13.0, 15.0, 17.0, 28.0, 33.0, 45.0, 69.0, 83.0, 125.0, 227.0, 397.0, 922.0, 11733.0, 3095074.0, 34483.0, 1208.0, 427.0, 229.0, 148.0, 87.0, 74.0, 44.0, 32.0, 29.0, 34.0, 14.0, 13.0, 8.0, 5.0, 9.0, 7.0, 4.0, 5.0, 3.0, 5.0, 0.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.59375, -27.716552734375, -26.83935546875, -25.962158203125, -25.0849609375, -24.207763671875, -23.33056640625, -22.453369140625, -21.576171875, -20.698974609375, -19.82177734375, -18.944580078125, -18.0673828125, -17.190185546875, -16.31298828125, -15.435791015625, -14.55859375, -13.681396484375, -12.80419921875, -11.927001953125, -11.0498046875, -10.172607421875, -9.29541015625, -8.418212890625, -7.541015625, -6.663818359375, -5.78662109375, -4.909423828125, -4.0322265625, -3.155029296875, -2.27783203125, -1.400634765625, -0.5234375, 0.353759765625, 1.23095703125, 2.108154296875, 2.9853515625, 3.862548828125, 4.73974609375, 5.616943359375, 6.494140625, 7.371337890625, 8.24853515625, 9.125732421875, 10.0029296875, 10.880126953125, 11.75732421875, 12.634521484375, 13.51171875, 14.388916015625, 15.26611328125, 16.143310546875, 17.0205078125, 17.897705078125, 18.77490234375, 19.652099609375, 20.529296875, 21.406494140625, 22.28369140625, 23.160888671875, 24.0380859375, 24.915283203125, 25.79248046875, 26.669677734375, 27.546875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 25.0, 33.0, 60.0, 99.0, 115.0, 149.0, 142.0, 133.0, 91.0, 72.0, 38.0, 16.0, 8.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.52664566040039, -14.085351943969727, -13.644058227539062, -13.202764511108398, -12.761470794677734, -12.32017707824707, -11.878883361816406, -11.437589645385742, -10.996295928955078, -10.555002212524414, -10.11370849609375, -9.672414779663086, -9.231121063232422, -8.789827346801758, -8.348533630371094, -7.9072394371032715, -7.465945243835449, -7.024651527404785, -6.583357810974121, -6.142064094543457, -5.700770378112793, -5.259476661682129, -4.818182468414307, -4.376888751983643, -3.9355950355529785, -3.4943013191223145, -3.0530076026916504, -2.6117136478424072, -2.170419931411743, -1.729126214981079, -1.287832260131836, -0.8465385437011719, -0.4052457809448242, 0.03604799509048462, 0.47734177112579346, 0.9186356067657471, 1.3599293231964111, 1.8012230396270752, 2.2425169944763184, 2.6838107109069824, 3.1251044273376465, 3.5663981437683105, 4.007691860198975, 4.448986053466797, 4.890279769897461, 5.331573486328125, 5.772867202758789, 6.214160919189453, 6.655454635620117, 7.096748352050781, 7.538042068481445, 7.979335784912109, 8.420629501342773, 8.861923217773438, 9.303216934204102, 9.744510650634766, 10.18580436706543, 10.627098083496094, 11.068391799926758, 11.509685516357422, 11.950979232788086, 12.39227294921875, 12.833566665649414, 13.274860382080078, 13.716155052185059]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 15.0, 10.0, 7.0, 22.0, 23.0, 19.0, 22.0, 24.0, 34.0, 23.0, 30.0, 32.0, 33.0, 26.0, 39.0, 35.0, 41.0, 36.0, 36.0, 38.0, 35.0, 31.0, 34.0, 30.0, 36.0, 34.0, 24.0, 29.0, 24.0, 21.0, 27.0, 26.0, 25.0, 9.0, 9.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.539243698120117, -21.860074996948242, -21.180908203125, -20.501739501953125, -19.82257080078125, -19.143402099609375, -18.4642333984375, -17.785066604614258, -17.105897903442383, -16.426729202270508, -15.74756145477295, -15.06839370727539, -14.389225006103516, -13.71005630493164, -13.030888557434082, -12.351720809936523, -11.672552108764648, -10.993383407592773, -10.314215660095215, -9.635047912597656, -8.955879211425781, -8.276710510253906, -7.597542762756348, -6.918374538421631, -6.239206314086914, -5.560038089752197, -4.8808698654174805, -4.201701641082764, -3.522533416748047, -2.84336519241333, -2.1641969680786133, -1.4850287437438965, -0.8058586120605469, -0.12669038772583008, 0.5524778366088867, 1.2316460609436035, 1.9108142852783203, 2.589982509613037, 3.269150733947754, 3.9483189582824707, 4.6274871826171875, 5.306655406951904, 5.985823631286621, 6.664991855621338, 7.344160079956055, 8.02332878112793, 8.702496528625488, 9.381664276123047, 10.060832977294922, 10.740001678466797, 11.419169425964355, 12.098337173461914, 12.777505874633789, 13.456674575805664, 14.135842323303223, 14.815010070800781, 15.494178771972656, 16.17334747314453, 16.852516174316406, 17.53168296813965, 18.210851669311523, 18.8900203704834, 19.56918716430664, 20.248355865478516, 20.92752456665039]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 12.0, 12.0, 9.0, 10.0, 14.0, 15.0, 16.0, 22.0, 21.0, 19.0, 28.0, 33.0, 25.0, 38.0, 33.0, 30.0, 45.0, 38.0, 46.0, 30.0, 43.0, 38.0, 50.0, 48.0, 40.0, 35.0, 25.0, 32.0, 29.0, 18.0, 17.0, 17.0, 16.0, 17.0, 13.0, 6.0, 12.0, 7.0, 8.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9931640625, -1.9227142333984375, -1.852264404296875, -1.7818145751953125, -1.71136474609375, -1.6409149169921875, -1.570465087890625, -1.5000152587890625, -1.4295654296875, -1.3591156005859375, -1.288665771484375, -1.2182159423828125, -1.14776611328125, -1.0773162841796875, -1.006866455078125, -0.9364166259765625, -0.865966796875, -0.7955169677734375, -0.725067138671875, -0.6546173095703125, -0.58416748046875, -0.5137176513671875, -0.443267822265625, -0.3728179931640625, -0.3023681640625, -0.2319183349609375, -0.161468505859375, -0.0910186767578125, -0.02056884765625, 0.0498809814453125, 0.120330810546875, 0.1907806396484375, 0.26123046875, 0.3316802978515625, 0.402130126953125, 0.4725799560546875, 0.54302978515625, 0.6134796142578125, 0.683929443359375, 0.7543792724609375, 0.8248291015625, 0.8952789306640625, 0.965728759765625, 1.0361785888671875, 1.10662841796875, 1.1770782470703125, 1.247528076171875, 1.3179779052734375, 1.388427734375, 1.4588775634765625, 1.529327392578125, 1.5997772216796875, 1.67022705078125, 1.7406768798828125, 1.811126708984375, 1.8815765380859375, 1.9520263671875, 2.0224761962890625, 2.092926025390625, 2.1633758544921875, 2.23382568359375, 2.3042755126953125, 2.374725341796875, 2.4451751708984375, 2.515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 16.0, 15.0, 14.0, 23.0, 21.0, 37.0, 48.0, 95.0, 152.0, 236.0, 398.0, 991.0, 2955.0, 13246.0, 90253.0, 644746.0, 2020426.0, 1185892.0, 200123.0, 26597.0, 5053.0, 1457.0, 618.0, 296.0, 173.0, 119.0, 89.0, 54.0, 38.0, 18.0, 17.0, 18.0, 7.0, 12.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.40625, -4.271484375, -4.13671875, -4.001953125, -3.8671875, -3.732421875, -3.59765625, -3.462890625, -3.328125, -3.193359375, -3.05859375, -2.923828125, -2.7890625, -2.654296875, -2.51953125, -2.384765625, -2.25, -2.115234375, -1.98046875, -1.845703125, -1.7109375, -1.576171875, -1.44140625, -1.306640625, -1.171875, -1.037109375, -0.90234375, -0.767578125, -0.6328125, -0.498046875, -0.36328125, -0.228515625, -0.09375, 0.041015625, 0.17578125, 0.310546875, 0.4453125, 0.580078125, 0.71484375, 0.849609375, 0.984375, 1.119140625, 1.25390625, 1.388671875, 1.5234375, 1.658203125, 1.79296875, 1.927734375, 2.0625, 2.197265625, 2.33203125, 2.466796875, 2.6015625, 2.736328125, 2.87109375, 3.005859375, 3.140625, 3.275390625, 3.41015625, 3.544921875, 3.6796875, 3.814453125, 3.94921875, 4.083984375, 4.21875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 10.0, 13.0, 16.0, 28.0, 54.0, 58.0, 91.0, 162.0, 232.0, 310.0, 431.0, 513.0, 535.0, 490.0, 369.0, 271.0, 171.0, 109.0, 66.0, 61.0, 26.0, 24.0, 15.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -5.99774169921875, -5.7767333984375, -5.55572509765625, -5.334716796875, -5.11370849609375, -4.8927001953125, -4.67169189453125, -4.45068359375, -4.22967529296875, -4.0086669921875, -3.78765869140625, -3.566650390625, -3.34564208984375, -3.1246337890625, -2.90362548828125, -2.6826171875, -2.46160888671875, -2.2406005859375, -2.01959228515625, -1.798583984375, -1.57757568359375, -1.3565673828125, -1.13555908203125, -0.91455078125, -0.69354248046875, -0.4725341796875, -0.25152587890625, -0.030517578125, 0.19049072265625, 0.4114990234375, 0.63250732421875, 0.853515625, 1.07452392578125, 1.2955322265625, 1.51654052734375, 1.737548828125, 1.95855712890625, 2.1795654296875, 2.40057373046875, 2.62158203125, 2.84259033203125, 3.0635986328125, 3.28460693359375, 3.505615234375, 3.72662353515625, 3.9476318359375, 4.16864013671875, 4.3896484375, 4.61065673828125, 4.8316650390625, 5.05267333984375, 5.273681640625, 5.49468994140625, 5.7156982421875, 5.93670654296875, 6.15771484375, 6.37872314453125, 6.5997314453125, 6.82073974609375, 7.041748046875, 7.26275634765625, 7.4837646484375, 7.70477294921875, 7.92578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 7.0, 9.0, 17.0, 16.0, 30.0, 41.0, 75.0, 72.0, 124.0, 165.0, 284.0, 550.0, 1624.0, 16959.0, 1029131.0, 3072042.0, 68404.0, 2931.0, 776.0, 362.0, 191.0, 128.0, 82.0, 78.0, 55.0, 43.0, 29.0, 17.0, 11.0, 7.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.21875, -14.7735595703125, -14.328369140625, -13.8831787109375, -13.43798828125, -12.9927978515625, -12.547607421875, -12.1024169921875, -11.6572265625, -11.2120361328125, -10.766845703125, -10.3216552734375, -9.87646484375, -9.4312744140625, -8.986083984375, -8.5408935546875, -8.095703125, -7.6505126953125, -7.205322265625, -6.7601318359375, -6.31494140625, -5.8697509765625, -5.424560546875, -4.9793701171875, -4.5341796875, -4.0889892578125, -3.643798828125, -3.1986083984375, -2.75341796875, -2.3082275390625, -1.863037109375, -1.4178466796875, -0.97265625, -0.5274658203125, -0.082275390625, 0.3629150390625, 0.80810546875, 1.2532958984375, 1.698486328125, 2.1436767578125, 2.5888671875, 3.0340576171875, 3.479248046875, 3.9244384765625, 4.36962890625, 4.8148193359375, 5.260009765625, 5.7052001953125, 6.150390625, 6.5955810546875, 7.040771484375, 7.4859619140625, 7.93115234375, 8.3763427734375, 8.821533203125, 9.2667236328125, 9.7119140625, 10.1571044921875, 10.602294921875, 11.0474853515625, 11.49267578125, 11.9378662109375, 12.383056640625, 12.8282470703125, 13.2734375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 17.0, 26.0, 71.0, 124.0, 202.0, 229.0, 168.0, 88.0, 57.0, 21.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.436946868896484, -42.96480178833008, -41.49265670776367, -40.0205078125, -38.548362731933594, -37.07621765136719, -35.60407257080078, -34.131927490234375, -32.65978240966797, -31.187637329101562, -29.715490341186523, -28.243345260620117, -26.77120018005371, -25.299053192138672, -23.826908111572266, -22.35476303100586, -20.88261604309082, -19.410470962524414, -17.938323974609375, -16.46617889404297, -14.994033813476562, -13.52188777923584, -12.049741744995117, -10.577596664428711, -9.105450630187988, -7.633305072784424, -6.161159515380859, -4.689013481140137, -3.2168679237365723, -1.7447223663330078, -0.27257633209228516, 1.199568748474121, 2.6717147827148438, 4.143860340118408, 5.616005897521973, 7.088151931762695, 8.560297012329102, 10.032443046569824, 11.504589080810547, 12.976734161376953, 14.448880195617676, 15.921026229858398, 17.393171310424805, 18.865318298339844, 20.33746337890625, 21.809608459472656, 23.281753540039062, 24.75389862060547, 26.226045608520508, 27.698190689086914, 29.170337677001953, 30.64248275756836, 32.114627838134766, 33.58677291870117, 35.058921813964844, 36.53106689453125, 38.003211975097656, 39.47535705566406, 40.94750213623047, 42.419647216796875, 43.89179611206055, 45.36394119262695, 46.83608627319336, 48.308231353759766, 49.78037643432617]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 7.0, 8.0, 5.0, 11.0, 14.0, 15.0, 12.0, 16.0, 20.0, 24.0, 29.0, 25.0, 31.0, 34.0, 44.0, 38.0, 32.0, 24.0, 33.0, 38.0, 33.0, 42.0, 45.0, 39.0, 25.0, 43.0, 35.0, 30.0, 32.0, 23.0, 32.0, 19.0, 14.0, 12.0, 15.0, 17.0, 14.0, 17.0, 12.0, 10.0, 5.0, 7.0, 6.0, 1.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.432432174682617, -15.915843963623047, -15.399256706237793, -14.882668495178223, -14.366081237792969, -13.849493026733398, -13.332904815673828, -12.816316604614258, -12.299729347229004, -11.783141136169434, -11.26655387878418, -10.74996566772461, -10.233377456665039, -9.716790199279785, -9.200201988220215, -8.683614730834961, -8.16702651977539, -7.6504387855529785, -7.133851051330566, -6.617262840270996, -6.100675106048584, -5.584087371826172, -5.067499160766602, -4.5509114265441895, -4.034323692321777, -3.5177359580993652, -3.001147985458374, -2.484560012817383, -1.9679722785949707, -1.4513845443725586, -0.9347965717315674, -0.41820859909057617, 0.09837722778320312, 0.6149650812149048, 1.1315529346466064, 1.648140788078308, 2.1647286415100098, 2.681316375732422, 3.197904348373413, 3.7144923210144043, 4.231080055236816, 4.7476677894592285, 5.264255523681641, 5.780843734741211, 6.297431468963623, 6.814019203186035, 7.3306074142456055, 7.847195148468018, 8.36378288269043, 8.88037109375, 9.396958351135254, 9.913546562194824, 10.430133819580078, 10.946722030639648, 11.463310241699219, 11.979898452758789, 12.496485710144043, 13.013073921203613, 13.529661178588867, 14.046249389648438, 14.562837600708008, 15.079424858093262, 15.596013069152832, 16.112600326538086, 16.629188537597656]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 13.0, 17.0, 11.0, 21.0, 11.0, 19.0, 21.0, 24.0, 23.0, 29.0, 38.0, 31.0, 40.0, 51.0, 42.0, 49.0, 41.0, 33.0, 44.0, 33.0, 46.0, 50.0, 25.0, 29.0, 32.0, 22.0, 22.0, 26.0, 16.0, 17.0, 15.0, 14.0, 10.0, 5.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0234375, -1.95208740234375, -1.8807373046875, -1.80938720703125, -1.738037109375, -1.66668701171875, -1.5953369140625, -1.52398681640625, -1.45263671875, -1.38128662109375, -1.3099365234375, -1.23858642578125, -1.167236328125, -1.09588623046875, -1.0245361328125, -0.95318603515625, -0.8818359375, -0.81048583984375, -0.7391357421875, -0.66778564453125, -0.596435546875, -0.52508544921875, -0.4537353515625, -0.38238525390625, -0.31103515625, -0.23968505859375, -0.1683349609375, -0.09698486328125, -0.025634765625, 0.04571533203125, 0.1170654296875, 0.18841552734375, 0.259765625, 0.33111572265625, 0.4024658203125, 0.47381591796875, 0.545166015625, 0.61651611328125, 0.6878662109375, 0.75921630859375, 0.83056640625, 0.90191650390625, 0.9732666015625, 1.04461669921875, 1.115966796875, 1.18731689453125, 1.2586669921875, 1.33001708984375, 1.4013671875, 1.47271728515625, 1.5440673828125, 1.61541748046875, 1.686767578125, 1.75811767578125, 1.8294677734375, 1.90081787109375, 1.97216796875, 2.04351806640625, 2.1148681640625, 2.18621826171875, 2.257568359375, 2.32891845703125, 2.4002685546875, 2.47161865234375, 2.54296875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 23.0, 30.0, 54.0, 62.0, 77.0, 136.0, 201.0, 294.0, 395.0, 549.0, 863.0, 1257.0, 1806.0, 2674.0, 3805.0, 5484.0, 8146.0, 11627.0, 17505.0, 26208.0, 40953.0, 68879.0, 124148.0, 260479.0, 206517.0, 101634.0, 57913.0, 35290.0, 22923.0, 15102.0, 10488.0, 7073.0, 4935.0, 3467.0, 2332.0, 1625.0, 1204.0, 747.0, 521.0, 325.0, 257.0, 194.0, 126.0, 72.0, 55.0, 37.0, 25.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.391845703125, -0.37953948974609375, -0.3672332763671875, -0.35492706298828125, -0.342620849609375, -0.33031463623046875, -0.3180084228515625, -0.30570220947265625, -0.29339599609375, -0.28108978271484375, -0.2687835693359375, -0.25647735595703125, -0.244171142578125, -0.23186492919921875, -0.2195587158203125, -0.20725250244140625, -0.1949462890625, -0.18264007568359375, -0.1703338623046875, -0.15802764892578125, -0.145721435546875, -0.13341522216796875, -0.1211090087890625, -0.10880279541015625, -0.09649658203125, -0.08419036865234375, -0.0718841552734375, -0.05957794189453125, -0.047271728515625, -0.03496551513671875, -0.0226593017578125, -0.01035308837890625, 0.001953125, 0.01425933837890625, 0.0265655517578125, 0.03887176513671875, 0.051177978515625, 0.06348419189453125, 0.0757904052734375, 0.08809661865234375, 0.10040283203125, 0.11270904541015625, 0.1250152587890625, 0.13732147216796875, 0.149627685546875, 0.16193389892578125, 0.1742401123046875, 0.18654632568359375, 0.1988525390625, 0.21115875244140625, 0.2234649658203125, 0.23577117919921875, 0.248077392578125, 0.26038360595703125, 0.2726898193359375, 0.28499603271484375, 0.29730224609375, 0.30960845947265625, 0.3219146728515625, 0.33422088623046875, 0.346527099609375, 0.35883331298828125, 0.3711395263671875, 0.38344573974609375, 0.395751953125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 18.0, 12.0, 15.0, 11.0, 20.0, 23.0, 22.0, 20.0, 27.0, 17.0, 30.0, 41.0, 34.0, 27.0, 28.0, 43.0, 38.0, 40.0, 1063.0, 42.0, 48.0, 27.0, 33.0, 29.0, 27.0, 30.0, 24.0, 33.0, 31.0, 18.0, 15.0, 17.0, 14.0, 11.0, 16.0, 12.0, 13.0, 10.0, 5.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-1.40234375, -1.3595123291015625, -1.316680908203125, -1.2738494873046875, -1.23101806640625, -1.1881866455078125, -1.145355224609375, -1.1025238037109375, -1.0596923828125, -1.0168609619140625, -0.974029541015625, -0.9311981201171875, -0.88836669921875, -0.8455352783203125, -0.802703857421875, -0.7598724365234375, -0.717041015625, -0.6742095947265625, -0.631378173828125, -0.5885467529296875, -0.54571533203125, -0.5028839111328125, -0.460052490234375, -0.4172210693359375, -0.3743896484375, -0.3315582275390625, -0.288726806640625, -0.2458953857421875, -0.20306396484375, -0.1602325439453125, -0.117401123046875, -0.0745697021484375, -0.03173828125, 0.0110931396484375, 0.053924560546875, 0.0967559814453125, 0.13958740234375, 0.1824188232421875, 0.225250244140625, 0.2680816650390625, 0.3109130859375, 0.3537445068359375, 0.396575927734375, 0.4394073486328125, 0.48223876953125, 0.5250701904296875, 0.567901611328125, 0.6107330322265625, 0.653564453125, 0.6963958740234375, 0.739227294921875, 0.7820587158203125, 0.82489013671875, 0.8677215576171875, 0.910552978515625, 0.9533843994140625, 0.9962158203125, 1.0390472412109375, 1.081878662109375, 1.1247100830078125, 1.16754150390625, 1.2103729248046875, 1.253204345703125, 1.2960357666015625, 1.3388671875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 1.0, 6.0, 7.0, 12.0, 15.0, 29.0, 38.0, 58.0, 78.0, 114.0, 180.0, 223.0, 338.0, 537.0, 650.0, 1030.0, 1518.0, 2065.0, 3145.0, 4553.0, 6539.0, 9904.0, 14499.0, 22395.0, 35776.0, 57815.0, 100816.0, 205360.0, 1316894.0, 123325.0, 68614.0, 41938.0, 26310.0, 16901.0, 11258.0, 7738.0, 5136.0, 3486.0, 2381.0, 1664.0, 1194.0, 796.0, 509.0, 439.0, 272.0, 199.0, 122.0, 104.0, 57.0, 30.0, 22.0, 21.0, 13.0, 6.0, 2.0, 8.0, 1.0, 1.0, 1.0], "bins": [-0.40380859375, -0.391632080078125, -0.37945556640625, -0.367279052734375, -0.3551025390625, -0.342926025390625, -0.33074951171875, -0.318572998046875, -0.306396484375, -0.294219970703125, -0.28204345703125, -0.269866943359375, -0.2576904296875, -0.245513916015625, -0.23333740234375, -0.221160888671875, -0.208984375, -0.196807861328125, -0.18463134765625, -0.172454833984375, -0.1602783203125, -0.148101806640625, -0.13592529296875, -0.123748779296875, -0.111572265625, -0.099395751953125, -0.08721923828125, -0.075042724609375, -0.0628662109375, -0.050689697265625, -0.03851318359375, -0.026336669921875, -0.01416015625, -0.001983642578125, 0.01019287109375, 0.022369384765625, 0.0345458984375, 0.046722412109375, 0.05889892578125, 0.071075439453125, 0.083251953125, 0.095428466796875, 0.10760498046875, 0.119781494140625, 0.1319580078125, 0.144134521484375, 0.15631103515625, 0.168487548828125, 0.1806640625, 0.192840576171875, 0.20501708984375, 0.217193603515625, 0.2293701171875, 0.241546630859375, 0.25372314453125, 0.265899658203125, 0.278076171875, 0.290252685546875, 0.30242919921875, 0.314605712890625, 0.3267822265625, 0.338958740234375, 0.35113525390625, 0.363311767578125, 0.37548828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 14.0, 13.0, 18.0, 26.0, 26.0, 34.0, 35.0, 58.0, 57.0, 65.0, 76.0, 74.0, 79.0, 64.0, 61.0, 51.0, 36.0, 36.0, 34.0, 23.0, 19.0, 22.0, 11.0, 11.0, 11.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031113624572753906, -0.00030126050114631653, -0.000291384756565094, -0.00028150901198387146, -0.0002716332674026489, -0.0002617575228214264, -0.00025188177824020386, -0.00024200603365898132, -0.0002321302890777588, -0.00022225454449653625, -0.00021237879991531372, -0.0002025030553340912, -0.00019262731075286865, -0.00018275156617164612, -0.00017287582159042358, -0.00016300007700920105, -0.00015312433242797852, -0.00014324858784675598, -0.00013337284326553345, -0.0001234970986843109, -0.00011362135410308838, -0.00010374560952186584, -9.386986494064331e-05, -8.399412035942078e-05, -7.411837577819824e-05, -6.424263119697571e-05, -5.4366886615753174e-05, -4.449114203453064e-05, -3.4615397453308105e-05, -2.473965287208557e-05, -1.4863908290863037e-05, -4.988163709640503e-06, 4.887580871582031e-06, 1.4763325452804565e-05, 2.46390700340271e-05, 3.4514814615249634e-05, 4.439055919647217e-05, 5.42663037776947e-05, 6.414204835891724e-05, 7.401779294013977e-05, 8.38935375213623e-05, 9.376928210258484e-05, 0.00010364502668380737, 0.00011352077126502991, 0.00012339651584625244, 0.00013327226042747498, 0.0001431480050086975, 0.00015302374958992004, 0.00016289949417114258, 0.0001727752387523651, 0.00018265098333358765, 0.00019252672791481018, 0.00020240247249603271, 0.00021227821707725525, 0.00022215396165847778, 0.00023202970623970032, 0.00024190545082092285, 0.0002517811954021454, 0.0002616569399833679, 0.00027153268456459045, 0.000281408429145813, 0.0002912841737270355, 0.00030115991830825806, 0.0003110356628894806, 0.0003209114074707031]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 9.0, 13.0, 12.0, 16.0, 39.0, 27.0, 65.0, 57.0, 87.0, 125.0, 213.0, 452.0, 1031.0, 49079.0, 993322.0, 2454.0, 617.0, 338.0, 212.0, 127.0, 71.0, 50.0, 35.0, 27.0, 14.0, 13.0, 13.0, 5.0, 6.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006374359130859375, -0.0061827898025512695, -0.005991220474243164, -0.005799651145935059, -0.005608081817626953, -0.005416512489318848, -0.005224943161010742, -0.005033373832702637, -0.004841804504394531, -0.004650235176086426, -0.00445866584777832, -0.004267096519470215, -0.004075527191162109, -0.003883957862854004, -0.0036923885345458984, -0.003500819206237793, -0.0033092498779296875, -0.003117680549621582, -0.0029261112213134766, -0.002734541893005371, -0.0025429725646972656, -0.00235140323638916, -0.0021598339080810547, -0.0019682645797729492, -0.0017766952514648438, -0.0015851259231567383, -0.0013935565948486328, -0.0012019872665405273, -0.0010104179382324219, -0.0008188486099243164, -0.0006272792816162109, -0.00043570995330810547, -0.000244140625, -5.257129669189453e-05, 0.00013899803161621094, 0.0003305673599243164, 0.0005221366882324219, 0.0007137060165405273, 0.0009052753448486328, 0.0010968446731567383, 0.0012884140014648438, 0.0014799833297729492, 0.0016715526580810547, 0.0018631219863891602, 0.0020546913146972656, 0.002246260643005371, 0.0024378299713134766, 0.002629399299621582, 0.0028209686279296875, 0.003012537956237793, 0.0032041072845458984, 0.003395676612854004, 0.0035872459411621094, 0.003778815269470215, 0.00397038459777832, 0.004161953926086426, 0.004353523254394531, 0.004545092582702637, 0.004736661911010742, 0.004928231239318848, 0.005119800567626953, 0.005311369895935059, 0.005502939224243164, 0.0056945085525512695, 0.005886077880859375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 31.0, 171.0, 409.0, 312.0, 78.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.001052223495207727, -0.001031066058203578, -0.0010099085047841072, -0.0009887510677799582, -0.0009675935725681484, -0.0009464360773563385, -0.0009252786403521895, -0.0009041211451403797, -0.0008829636499285698, -0.0008618061547167599, -0.000840648717712611, -0.0008194912225008011, -0.0007983337272889912, -0.0007771762320771813, -0.0007560187950730324, -0.0007348612998612225, -0.0007137038628570735, -0.0006925463676452637, -0.0006713889306411147, -0.0006502314354293048, -0.000629073940217495, -0.000607916503213346, -0.0005867590080015361, -0.0005656015127897263, -0.0005444440757855773, -0.0005232865805737674, -0.0005021291435696185, -0.0004809716483578086, -0.0004598141531459987, -0.0004386566870380193, -0.0004174992209300399, -0.00039634172571823, -0.00037518423050642014, -0.0003540267643984407, -0.00033286926918663085, -0.00031171180307865143, -0.00029055430786684155, -0.00026939684175886214, -0.0002482393756508827, -0.00022708189499098808, -0.00020592441433109343, -0.00018476693367119879, -0.00016360945301130414, -0.00014245198690332472, -0.00012129450624343008, -0.00010013702558353543, -7.897955947555602e-05, -5.782207881566137e-05, -3.6664598155766726e-05, -1.5507121133850887e-05, 5.650355888064951e-06, 2.6807829272001982e-05, 4.796530993189663e-05, 6.912279059179127e-05, 9.028025669977069e-05, 0.00011143773735966533, 0.00013259521801955998, 0.00015375269867945462, 0.00017491017933934927, 0.0001960676454473287, 0.00021722512610722333, 0.00023838260676711798, 0.0002595400728750974, 0.0002806975389830768, 0.0003018550341948867]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 13.0, 8.0, 11.0, 14.0, 16.0, 18.0, 24.0, 29.0, 19.0, 20.0, 35.0, 30.0, 48.0, 34.0, 42.0, 37.0, 54.0, 41.0, 46.0, 42.0, 46.0, 34.0, 46.0, 32.0, 41.0, 25.0, 20.0, 26.0, 11.0, 20.0, 20.0, 15.0, 17.0, 11.0, 6.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001252293586730957, -0.00012072548270225525, -0.0001162216067314148, -0.00011171773076057434, -0.00010721385478973389, -0.00010270997881889343, -9.820610284805298e-05, -9.370222687721252e-05, -8.919835090637207e-05, -8.469447493553162e-05, -8.019059896469116e-05, -7.568672299385071e-05, -7.118284702301025e-05, -6.66789710521698e-05, -6.217509508132935e-05, -5.767121911048889e-05, -5.316734313964844e-05, -4.8663467168807983e-05, -4.415959119796753e-05, -3.9655715227127075e-05, -3.515183925628662e-05, -3.064796328544617e-05, -2.6144087314605713e-05, -2.164021134376526e-05, -1.7136335372924805e-05, -1.263245940208435e-05, -8.128583431243896e-06, -3.6247074604034424e-06, 8.791685104370117e-07, 5.383044481277466e-06, 9.88692045211792e-06, 1.4390796422958374e-05, 1.8894672393798828e-05, 2.3398548364639282e-05, 2.7902424335479736e-05, 3.240630030632019e-05, 3.6910176277160645e-05, 4.14140522480011e-05, 4.591792821884155e-05, 5.042180418968201e-05, 5.492568016052246e-05, 5.9429556131362915e-05, 6.393343210220337e-05, 6.843730807304382e-05, 7.294118404388428e-05, 7.744506001472473e-05, 8.194893598556519e-05, 8.645281195640564e-05, 9.09566879272461e-05, 9.546056389808655e-05, 9.9964439868927e-05, 0.00010446831583976746, 0.00010897219181060791, 0.00011347606778144836, 0.00011797994375228882, 0.00012248381972312927, 0.00012698769569396973, 0.00013149157166481018, 0.00013599544763565063, 0.0001404993236064911, 0.00014500319957733154, 0.000149507075548172, 0.00015401095151901245, 0.0001585148274898529, 0.00016301870346069336]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 13.0, 17.0, 11.0, 21.0, 11.0, 18.0, 22.0, 24.0, 23.0, 29.0, 38.0, 31.0, 40.0, 51.0, 42.0, 49.0, 41.0, 33.0, 44.0, 33.0, 46.0, 50.0, 25.0, 29.0, 32.0, 22.0, 22.0, 26.0, 16.0, 17.0, 15.0, 14.0, 10.0, 5.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0234375, -1.95208740234375, -1.8807373046875, -1.80938720703125, -1.738037109375, -1.66668701171875, -1.5953369140625, -1.52398681640625, -1.45263671875, -1.38128662109375, -1.3099365234375, -1.23858642578125, -1.167236328125, -1.09588623046875, -1.0245361328125, -0.95318603515625, -0.8818359375, -0.81048583984375, -0.7391357421875, -0.66778564453125, -0.596435546875, -0.52508544921875, -0.4537353515625, -0.38238525390625, -0.31103515625, -0.23968505859375, -0.1683349609375, -0.09698486328125, -0.025634765625, 0.04571533203125, 0.1170654296875, 0.18841552734375, 0.259765625, 0.33111572265625, 0.4024658203125, 0.47381591796875, 0.545166015625, 0.61651611328125, 0.6878662109375, 0.75921630859375, 0.83056640625, 0.90191650390625, 0.9732666015625, 1.04461669921875, 1.115966796875, 1.18731689453125, 1.2586669921875, 1.33001708984375, 1.4013671875, 1.47271728515625, 1.5440673828125, 1.61541748046875, 1.686767578125, 1.75811767578125, 1.8294677734375, 1.90081787109375, 1.97216796875, 2.04351806640625, 2.1148681640625, 2.18621826171875, 2.257568359375, 2.32891845703125, 2.4002685546875, 2.47161865234375, 2.54296875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 8.0, 12.0, 29.0, 28.0, 46.0, 83.0, 109.0, 165.0, 272.0, 375.0, 746.0, 1437.0, 3049.0, 6783.0, 15015.0, 32352.0, 68894.0, 148818.0, 275635.0, 254427.0, 128304.0, 59757.0, 27843.0, 12853.0, 5893.0, 2642.0, 1285.0, 675.0, 381.0, 212.0, 150.0, 82.0, 59.0, 49.0, 25.0, 19.0, 18.0, 8.0, 9.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.087921142578125, -2.01568603515625, -1.943450927734375, -1.8712158203125, -1.798980712890625, -1.72674560546875, -1.654510498046875, -1.582275390625, -1.510040283203125, -1.43780517578125, -1.365570068359375, -1.2933349609375, -1.221099853515625, -1.14886474609375, -1.076629638671875, -1.00439453125, -0.932159423828125, -0.85992431640625, -0.787689208984375, -0.7154541015625, -0.643218994140625, -0.57098388671875, -0.498748779296875, -0.426513671875, -0.354278564453125, -0.28204345703125, -0.209808349609375, -0.1375732421875, -0.065338134765625, 0.00689697265625, 0.079132080078125, 0.1513671875, 0.223602294921875, 0.29583740234375, 0.368072509765625, 0.4403076171875, 0.512542724609375, 0.58477783203125, 0.657012939453125, 0.729248046875, 0.801483154296875, 0.87371826171875, 0.945953369140625, 1.0181884765625, 1.090423583984375, 1.16265869140625, 1.234893798828125, 1.30712890625, 1.379364013671875, 1.45159912109375, 1.523834228515625, 1.5960693359375, 1.668304443359375, 1.74053955078125, 1.812774658203125, 1.885009765625, 1.957244873046875, 2.02947998046875, 2.101715087890625, 2.1739501953125, 2.246185302734375, 2.31842041015625, 2.390655517578125, 2.462890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 14.0, 11.0, 11.0, 12.0, 16.0, 30.0, 31.0, 38.0, 45.0, 57.0, 68.0, 85.0, 141.0, 411.0, 1477.0, 168.0, 81.0, 57.0, 64.0, 43.0, 44.0, 33.0, 27.0, 24.0, 10.0, 9.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.9559326171875, -14.552490234375, -14.1490478515625, -13.74560546875, -13.3421630859375, -12.938720703125, -12.5352783203125, -12.1318359375, -11.7283935546875, -11.324951171875, -10.9215087890625, -10.51806640625, -10.1146240234375, -9.711181640625, -9.3077392578125, -8.904296875, -8.5008544921875, -8.097412109375, -7.6939697265625, -7.29052734375, -6.8870849609375, -6.483642578125, -6.0802001953125, -5.6767578125, -5.2733154296875, -4.869873046875, -4.4664306640625, -4.06298828125, -3.6595458984375, -3.256103515625, -2.8526611328125, -2.44921875, -2.0457763671875, -1.642333984375, -1.2388916015625, -0.83544921875, -0.4320068359375, -0.028564453125, 0.3748779296875, 0.7783203125, 1.1817626953125, 1.585205078125, 1.9886474609375, 2.39208984375, 2.7955322265625, 3.198974609375, 3.6024169921875, 4.005859375, 4.4093017578125, 4.812744140625, 5.2161865234375, 5.61962890625, 6.0230712890625, 6.426513671875, 6.8299560546875, 7.2333984375, 7.6368408203125, 8.040283203125, 8.4437255859375, 8.84716796875, 9.2506103515625, 9.654052734375, 10.0574951171875, 10.4609375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 11.0, 8.0, 12.0, 18.0, 20.0, 29.0, 26.0, 61.0, 77.0, 118.0, 189.0, 336.0, 622.0, 3461.0, 2998112.0, 140093.0, 1213.0, 485.0, 263.0, 147.0, 97.0, 68.0, 52.0, 45.0, 30.0, 27.0, 15.0, 18.0, 17.0, 5.0, 5.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.390625, -26.328857421875, -25.26708984375, -24.205322265625, -23.1435546875, -22.081787109375, -21.02001953125, -19.958251953125, -18.896484375, -17.834716796875, -16.77294921875, -15.711181640625, -14.6494140625, -13.587646484375, -12.52587890625, -11.464111328125, -10.40234375, -9.340576171875, -8.27880859375, -7.217041015625, -6.1552734375, -5.093505859375, -4.03173828125, -2.969970703125, -1.908203125, -0.846435546875, 0.21533203125, 1.277099609375, 2.3388671875, 3.400634765625, 4.46240234375, 5.524169921875, 6.5859375, 7.647705078125, 8.70947265625, 9.771240234375, 10.8330078125, 11.894775390625, 12.95654296875, 14.018310546875, 15.080078125, 16.141845703125, 17.20361328125, 18.265380859375, 19.3271484375, 20.388916015625, 21.45068359375, 22.512451171875, 23.57421875, 24.635986328125, 25.69775390625, 26.759521484375, 27.8212890625, 28.883056640625, 29.94482421875, 31.006591796875, 32.068359375, 33.130126953125, 34.19189453125, 35.253662109375, 36.3154296875, 37.377197265625, 38.43896484375, 39.500732421875, 40.5625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 10.0, 38.0, 109.0, 222.0, 303.0, 203.0, 93.0, 28.0, 10.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.79438591003418, -28.78071403503418, -27.76704216003418, -26.75337028503418, -25.73969841003418, -24.72602653503418, -23.712352752685547, -22.698680877685547, -21.685009002685547, -20.671337127685547, -19.657665252685547, -18.643993377685547, -17.630321502685547, -16.616649627685547, -15.60297679901123, -14.58930492401123, -13.575634002685547, -12.561962127685547, -11.548290252685547, -10.534618377685547, -9.520946502685547, -8.507274627685547, -7.4936017990112305, -6.4799299240112305, -5.4662580490112305, -4.4525861740112305, -3.4389140605926514, -2.4252419471740723, -1.4115700721740723, -0.39789819717407227, 0.6157741546630859, 1.629446029663086, 2.643115997314453, 3.656787872314453, 4.670459747314453, 5.684132099151611, 6.697803974151611, 7.711475849151611, 8.72514820098877, 9.73882007598877, 10.75249195098877, 11.76616382598877, 12.77983570098877, 13.793508529663086, 14.807180404663086, 15.820852279663086, 16.834524154663086, 17.848196029663086, 18.861867904663086, 19.875539779663086, 20.889211654663086, 21.902883529663086, 22.916555404663086, 23.930227279663086, 24.94390106201172, 25.95757293701172, 26.97124481201172, 27.98491668701172, 28.99858856201172, 30.01226043701172, 31.02593231201172, 32.03960418701172, 33.05327606201172, 34.06694793701172, 35.08061981201172]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 5.0, 9.0, 11.0, 17.0, 18.0, 19.0, 20.0, 15.0, 26.0, 24.0, 23.0, 33.0, 35.0, 32.0, 37.0, 41.0, 38.0, 36.0, 36.0, 49.0, 51.0, 42.0, 35.0, 35.0, 32.0, 29.0, 23.0, 28.0, 24.0, 26.0, 26.0, 20.0, 19.0, 18.0, 14.0, 7.0, 5.0, 9.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.522613525390625, -18.866973876953125, -18.211334228515625, -17.555696487426758, -16.900056838989258, -16.244417190551758, -15.588777542114258, -14.933137893676758, -14.277499198913574, -13.621859550476074, -12.96622085571289, -12.31058120727539, -11.65494155883789, -10.999302864074707, -10.343663215637207, -9.688024520874023, -9.032384872436523, -8.376745223999023, -7.72110652923584, -7.06546688079834, -6.409827709197998, -5.754188537597656, -5.098548889160156, -4.4429097175598145, -3.7872705459594727, -3.131631374359131, -2.47599196434021, -1.8203526735305786, -1.1647133827209473, -0.5090742111206055, 0.14656519889831543, 0.8022046089172363, 1.4578437805175781, 2.11348295211792, 2.769122362136841, 3.4247617721557617, 4.0804009437561035, 4.736040115356445, 5.391679763793945, 6.047318935394287, 6.702958106994629, 7.358597278594971, 8.014236450195312, 8.669876098632812, 9.325515747070312, 9.981154441833496, 10.636794090270996, 11.29243278503418, 11.94807243347168, 12.60371208190918, 13.259350776672363, 13.914990425109863, 14.570629119873047, 15.226268768310547, 15.881908416748047, 16.537548065185547, 17.193187713623047, 17.848827362060547, 18.504467010498047, 19.160104751586914, 19.815744400024414, 20.471384048461914, 21.127023696899414, 21.782663345336914, 22.43830108642578]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 6.0, 4.0, 7.0, 5.0, 4.0, 12.0, 11.0, 6.0, 18.0, 16.0, 22.0, 12.0, 25.0, 20.0, 19.0, 27.0, 33.0, 33.0, 32.0, 43.0, 42.0, 26.0, 40.0, 49.0, 41.0, 49.0, 44.0, 32.0, 30.0, 22.0, 38.0, 39.0, 28.0, 26.0, 18.0, 13.0, 14.0, 16.0, 13.0, 9.0, 10.0, 12.0, 6.0, 10.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.412109375, -2.335784912109375, -2.25946044921875, -2.183135986328125, -2.1068115234375, -2.030487060546875, -1.95416259765625, -1.877838134765625, -1.801513671875, -1.725189208984375, -1.64886474609375, -1.572540283203125, -1.4962158203125, -1.419891357421875, -1.34356689453125, -1.267242431640625, -1.19091796875, -1.114593505859375, -1.03826904296875, -0.961944580078125, -0.8856201171875, -0.809295654296875, -0.73297119140625, -0.656646728515625, -0.580322265625, -0.503997802734375, -0.42767333984375, -0.351348876953125, -0.2750244140625, -0.198699951171875, -0.12237548828125, -0.046051025390625, 0.0302734375, 0.106597900390625, 0.18292236328125, 0.259246826171875, 0.3355712890625, 0.411895751953125, 0.48822021484375, 0.564544677734375, 0.640869140625, 0.717193603515625, 0.79351806640625, 0.869842529296875, 0.9461669921875, 1.022491455078125, 1.09881591796875, 1.175140380859375, 1.25146484375, 1.327789306640625, 1.40411376953125, 1.480438232421875, 1.5567626953125, 1.633087158203125, 1.70941162109375, 1.785736083984375, 1.862060546875, 1.938385009765625, 2.01470947265625, 2.091033935546875, 2.1673583984375, 2.243682861328125, 2.32000732421875, 2.396331787109375, 2.47265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 3.0, 5.0, 8.0, 12.0, 15.0, 9.0, 14.0, 20.0, 22.0, 20.0, 28.0, 25.0, 34.0, 60.0, 73.0, 144.0, 282.0, 643.0, 2787.0, 46087.0, 1621350.0, 2416521.0, 99917.0, 4383.0, 869.0, 357.0, 170.0, 98.0, 69.0, 50.0, 34.0, 21.0, 26.0, 11.0, 14.0, 9.0, 17.0, 7.0, 11.0, 11.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.7109375, -8.4395751953125, -8.168212890625, -7.8968505859375, -7.62548828125, -7.3541259765625, -7.082763671875, -6.8114013671875, -6.5400390625, -6.2686767578125, -5.997314453125, -5.7259521484375, -5.45458984375, -5.1832275390625, -4.911865234375, -4.6405029296875, -4.369140625, -4.0977783203125, -3.826416015625, -3.5550537109375, -3.28369140625, -3.0123291015625, -2.740966796875, -2.4696044921875, -2.1982421875, -1.9268798828125, -1.655517578125, -1.3841552734375, -1.11279296875, -0.8414306640625, -0.570068359375, -0.2987060546875, -0.02734375, 0.2440185546875, 0.515380859375, 0.7867431640625, 1.05810546875, 1.3294677734375, 1.600830078125, 1.8721923828125, 2.1435546875, 2.4149169921875, 2.686279296875, 2.9576416015625, 3.22900390625, 3.5003662109375, 3.771728515625, 4.0430908203125, 4.314453125, 4.5858154296875, 4.857177734375, 5.1285400390625, 5.39990234375, 5.6712646484375, 5.942626953125, 6.2139892578125, 6.4853515625, 6.7567138671875, 7.028076171875, 7.2994384765625, 7.57080078125, 7.8421630859375, 8.113525390625, 8.3848876953125, 8.65625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 7.0, 11.0, 15.0, 22.0, 30.0, 52.0, 67.0, 92.0, 126.0, 164.0, 234.0, 306.0, 385.0, 401.0, 478.0, 389.0, 350.0, 265.0, 189.0, 125.0, 90.0, 80.0, 55.0, 40.0, 24.0, 21.0, 10.0, 14.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.17578125, -6.9925537109375, -6.809326171875, -6.6260986328125, -6.44287109375, -6.2596435546875, -6.076416015625, -5.8931884765625, -5.7099609375, -5.5267333984375, -5.343505859375, -5.1602783203125, -4.97705078125, -4.7938232421875, -4.610595703125, -4.4273681640625, -4.244140625, -4.0609130859375, -3.877685546875, -3.6944580078125, -3.51123046875, -3.3280029296875, -3.144775390625, -2.9615478515625, -2.7783203125, -2.5950927734375, -2.411865234375, -2.2286376953125, -2.04541015625, -1.8621826171875, -1.678955078125, -1.4957275390625, -1.3125, -1.1292724609375, -0.946044921875, -0.7628173828125, -0.57958984375, -0.3963623046875, -0.213134765625, -0.0299072265625, 0.1533203125, 0.3365478515625, 0.519775390625, 0.7030029296875, 0.88623046875, 1.0694580078125, 1.252685546875, 1.4359130859375, 1.619140625, 1.8023681640625, 1.985595703125, 2.1688232421875, 2.35205078125, 2.5352783203125, 2.718505859375, 2.9017333984375, 3.0849609375, 3.2681884765625, 3.451416015625, 3.6346435546875, 3.81787109375, 4.0010986328125, 4.184326171875, 4.3675537109375, 4.55078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 8.0, 3.0, 10.0, 14.0, 10.0, 22.0, 28.0, 47.0, 41.0, 68.0, 90.0, 106.0, 147.0, 203.0, 303.0, 574.0, 2231.0, 40027.0, 2164632.0, 1947216.0, 34738.0, 2103.0, 578.0, 307.0, 219.0, 153.0, 91.0, 83.0, 57.0, 59.0, 37.0, 21.0, 11.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.83203125, -10.3984375, -9.96484375, -9.53125, -9.09765625, -8.6640625, -8.23046875, -7.796875, -7.36328125, -6.9296875, -6.49609375, -6.0625, -5.62890625, -5.1953125, -4.76171875, -4.328125, -3.89453125, -3.4609375, -3.02734375, -2.59375, -2.16015625, -1.7265625, -1.29296875, -0.859375, -0.42578125, 0.0078125, 0.44140625, 0.875, 1.30859375, 1.7421875, 2.17578125, 2.609375, 3.04296875, 3.4765625, 3.91015625, 4.34375, 4.77734375, 5.2109375, 5.64453125, 6.078125, 6.51171875, 6.9453125, 7.37890625, 7.8125, 8.24609375, 8.6796875, 9.11328125, 9.546875, 9.98046875, 10.4140625, 10.84765625, 11.28125, 11.71484375, 12.1484375, 12.58203125, 13.015625, 13.44921875, 13.8828125, 14.31640625, 14.75, 15.18359375, 15.6171875, 16.05078125, 16.484375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 19.0, 31.0, 63.0, 87.0, 123.0, 168.0, 169.0, 155.0, 102.0, 43.0, 27.0, 17.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.459632873535156, -26.364343643188477, -25.269054412841797, -24.173765182495117, -23.078475952148438, -21.983186721801758, -20.887897491455078, -19.7926082611084, -18.69731903076172, -17.60202980041504, -16.50674057006836, -15.41145133972168, -14.316162109375, -13.22087287902832, -12.12558364868164, -11.030294418334961, -9.935005187988281, -8.839715957641602, -7.744426727294922, -6.649137496948242, -5.5538482666015625, -4.458559036254883, -3.363269805908203, -2.2679805755615234, -1.1726913452148438, -0.07740211486816406, 1.0178871154785156, 2.1131763458251953, 3.208465576171875, 4.303754806518555, 5.399044036865234, 6.494333267211914, 7.589618682861328, 8.684907913208008, 9.780197143554688, 10.875486373901367, 11.970775604248047, 13.066064834594727, 14.161354064941406, 15.256643295288086, 16.351932525634766, 17.447221755981445, 18.542510986328125, 19.637800216674805, 20.733089447021484, 21.828378677368164, 22.923667907714844, 24.018957138061523, 25.114246368408203, 26.209535598754883, 27.304824829101562, 28.400114059448242, 29.495403289794922, 30.5906925201416, 31.68598175048828, 32.781272888183594, 33.87656021118164, 34.97184753417969, 36.067138671875, 37.16242980957031, 38.25771713256836, 39.353004455566406, 40.44829559326172, 41.54358673095703, 42.63887405395508]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 12.0, 9.0, 14.0, 18.0, 25.0, 26.0, 35.0, 36.0, 26.0, 34.0, 36.0, 39.0, 33.0, 36.0, 44.0, 43.0, 46.0, 32.0, 45.0, 40.0, 41.0, 42.0, 36.0, 33.0, 35.0, 32.0, 26.0, 16.0, 21.0, 13.0, 12.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.082216262817383, -17.480741500854492, -16.879268646240234, -16.277793884277344, -15.676319122314453, -15.074845314025879, -14.473371505737305, -13.871896743774414, -13.27042293548584, -12.668949127197266, -12.067474365234375, -11.4660005569458, -10.864526748657227, -10.263051986694336, -9.661578178405762, -9.060104370117188, -8.458629608154297, -7.8571553230285645, -7.255681037902832, -6.654207229614258, -6.052732944488525, -5.451258659362793, -4.849784851074219, -4.248310565948486, -3.646836280822754, -3.0453619956970215, -2.443887948989868, -1.8424137830734253, -1.2409396171569824, -0.63946533203125, -0.03799128532409668, 0.5634827613830566, 1.1649551391601562, 1.7664293050765991, 2.367903470993042, 2.9693775177001953, 3.5708518028259277, 4.17232608795166, 4.773799896240234, 5.375274181365967, 5.976748466491699, 6.578222751617432, 7.179697036743164, 7.781170845031738, 8.382644653320312, 8.984119415283203, 9.585593223571777, 10.187067031860352, 10.788541793823242, 11.390015602111816, 11.991490364074707, 12.592964172363281, 13.194438934326172, 13.795912742614746, 14.39738655090332, 14.998861312866211, 15.600335121154785, 16.20180892944336, 16.80328369140625, 17.40475845336914, 18.0062313079834, 18.60770606994629, 19.20918083190918, 19.810653686523438, 20.412128448486328]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 9.0, 5.0, 15.0, 13.0, 15.0, 14.0, 20.0, 16.0, 18.0, 20.0, 21.0, 29.0, 23.0, 30.0, 30.0, 36.0, 41.0, 44.0, 52.0, 41.0, 44.0, 40.0, 39.0, 36.0, 35.0, 33.0, 32.0, 38.0, 23.0, 20.0, 24.0, 25.0, 12.0, 10.0, 13.0, 13.0, 7.0, 12.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.42578125, -2.35235595703125, -2.2789306640625, -2.20550537109375, -2.132080078125, -2.05865478515625, -1.9852294921875, -1.91180419921875, -1.83837890625, -1.76495361328125, -1.6915283203125, -1.61810302734375, -1.544677734375, -1.47125244140625, -1.3978271484375, -1.32440185546875, -1.2509765625, -1.17755126953125, -1.1041259765625, -1.03070068359375, -0.957275390625, -0.88385009765625, -0.8104248046875, -0.73699951171875, -0.66357421875, -0.59014892578125, -0.5167236328125, -0.44329833984375, -0.369873046875, -0.29644775390625, -0.2230224609375, -0.14959716796875, -0.076171875, -0.00274658203125, 0.0706787109375, 0.14410400390625, 0.217529296875, 0.29095458984375, 0.3643798828125, 0.43780517578125, 0.51123046875, 0.58465576171875, 0.6580810546875, 0.73150634765625, 0.804931640625, 0.87835693359375, 0.9517822265625, 1.02520751953125, 1.0986328125, 1.17205810546875, 1.2454833984375, 1.31890869140625, 1.392333984375, 1.46575927734375, 1.5391845703125, 1.61260986328125, 1.68603515625, 1.75946044921875, 1.8328857421875, 1.90631103515625, 1.979736328125, 2.05316162109375, 2.1265869140625, 2.20001220703125, 2.2734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 10.0, 10.0, 17.0, 24.0, 37.0, 45.0, 83.0, 105.0, 149.0, 232.0, 384.0, 533.0, 819.0, 1184.0, 1723.0, 2551.0, 3651.0, 5387.0, 7826.0, 11184.0, 16615.0, 25372.0, 40039.0, 66139.0, 122234.0, 264629.0, 215312.0, 100836.0, 56405.0, 34962.0, 22674.0, 15127.0, 10316.0, 6886.0, 4774.0, 3258.0, 2317.0, 1443.0, 1045.0, 753.0, 491.0, 325.0, 229.0, 131.0, 99.0, 64.0, 47.0, 41.0, 16.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4189453125, -0.4053688049316406, -0.39179229736328125, -0.3782157897949219, -0.3646392822265625, -0.3510627746582031, -0.33748626708984375, -0.3239097595214844, -0.310333251953125, -0.2967567443847656, -0.28318023681640625, -0.2696037292480469, -0.2560272216796875, -0.24245071411132812, -0.22887420654296875, -0.21529769897460938, -0.20172119140625, -0.18814468383789062, -0.17456817626953125, -0.16099166870117188, -0.1474151611328125, -0.13383865356445312, -0.12026214599609375, -0.10668563842773438, -0.093109130859375, -0.07953262329101562, -0.06595611572265625, -0.052379608154296875, -0.0388031005859375, -0.025226593017578125, -0.01165008544921875, 0.001926422119140625, 0.0155029296875, 0.029079437255859375, 0.04265594482421875, 0.056232452392578125, 0.0698089599609375, 0.08338546752929688, 0.09696197509765625, 0.11053848266601562, 0.124114990234375, 0.13769149780273438, 0.15126800537109375, 0.16484451293945312, 0.1784210205078125, 0.19199752807617188, 0.20557403564453125, 0.21915054321289062, 0.23272705078125, 0.24630355834960938, 0.25988006591796875, 0.2734565734863281, 0.2870330810546875, 0.3006095886230469, 0.31418609619140625, 0.3277626037597656, 0.341339111328125, 0.3549156188964844, 0.36849212646484375, 0.3820686340332031, 0.3956451416015625, 0.4092216491699219, 0.42279815673828125, 0.4363746643066406, 0.449951171875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 7.0, 14.0, 13.0, 11.0, 9.0, 24.0, 25.0, 23.0, 20.0, 23.0, 22.0, 30.0, 24.0, 38.0, 38.0, 50.0, 37.0, 43.0, 1063.0, 42.0, 40.0, 47.0, 39.0, 36.0, 28.0, 31.0, 36.0, 18.0, 30.0, 27.0, 18.0, 21.0, 11.0, 12.0, 15.0, 7.0, 10.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.53125, -1.4826507568359375, -1.434051513671875, -1.3854522705078125, -1.33685302734375, -1.2882537841796875, -1.239654541015625, -1.1910552978515625, -1.1424560546875, -1.0938568115234375, -1.045257568359375, -0.9966583251953125, -0.94805908203125, -0.8994598388671875, -0.850860595703125, -0.8022613525390625, -0.753662109375, -0.7050628662109375, -0.656463623046875, -0.6078643798828125, -0.55926513671875, -0.5106658935546875, -0.462066650390625, -0.4134674072265625, -0.3648681640625, -0.3162689208984375, -0.267669677734375, -0.2190704345703125, -0.17047119140625, -0.1218719482421875, -0.073272705078125, -0.0246734619140625, 0.02392578125, 0.0725250244140625, 0.121124267578125, 0.1697235107421875, 0.21832275390625, 0.2669219970703125, 0.315521240234375, 0.3641204833984375, 0.4127197265625, 0.4613189697265625, 0.509918212890625, 0.5585174560546875, 0.60711669921875, 0.6557159423828125, 0.704315185546875, 0.7529144287109375, 0.801513671875, 0.8501129150390625, 0.898712158203125, 0.9473114013671875, 0.99591064453125, 1.0445098876953125, 1.093109130859375, 1.1417083740234375, 1.1903076171875, 1.2389068603515625, 1.287506103515625, 1.3361053466796875, 1.38470458984375, 1.4333038330078125, 1.481903076171875, 1.5305023193359375, 1.5791015625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 18.0, 19.0, 28.0, 53.0, 61.0, 78.0, 130.0, 195.0, 261.0, 422.0, 662.0, 947.0, 1447.0, 2107.0, 3272.0, 4734.0, 7312.0, 11066.0, 17337.0, 27105.0, 44512.0, 75686.0, 145470.0, 1343819.0, 181949.0, 89946.0, 50980.0, 30767.0, 19588.0, 12439.0, 8352.0, 5361.0, 3657.0, 2461.0, 1603.0, 1100.0, 734.0, 500.0, 332.0, 206.0, 142.0, 85.0, 66.0, 32.0, 31.0, 25.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.43017578125, -0.4165802001953125, -0.402984619140625, -0.3893890380859375, -0.37579345703125, -0.3621978759765625, -0.348602294921875, -0.3350067138671875, -0.3214111328125, -0.3078155517578125, -0.294219970703125, -0.2806243896484375, -0.26702880859375, -0.2534332275390625, -0.239837646484375, -0.2262420654296875, -0.212646484375, -0.1990509033203125, -0.185455322265625, -0.1718597412109375, -0.15826416015625, -0.1446685791015625, -0.131072998046875, -0.1174774169921875, -0.1038818359375, -0.0902862548828125, -0.076690673828125, -0.0630950927734375, -0.04949951171875, -0.0359039306640625, -0.022308349609375, -0.0087127685546875, 0.0048828125, 0.0184783935546875, 0.032073974609375, 0.0456695556640625, 0.05926513671875, 0.0728607177734375, 0.086456298828125, 0.1000518798828125, 0.1136474609375, 0.1272430419921875, 0.140838623046875, 0.1544342041015625, 0.16802978515625, 0.1816253662109375, 0.195220947265625, 0.2088165283203125, 0.222412109375, 0.2360076904296875, 0.249603271484375, 0.2631988525390625, 0.27679443359375, 0.2903900146484375, 0.303985595703125, 0.3175811767578125, 0.3311767578125, 0.3447723388671875, 0.358367919921875, 0.3719635009765625, 0.38555908203125, 0.3991546630859375, 0.412750244140625, 0.4263458251953125, 0.43994140625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 6.0, 12.0, 9.0, 17.0, 15.0, 12.0, 16.0, 28.0, 25.0, 34.0, 29.0, 51.0, 49.0, 41.0, 46.0, 50.0, 59.0, 50.0, 67.0, 54.0, 54.0, 42.0, 33.0, 37.0, 26.0, 25.0, 13.0, 16.0, 13.0, 14.0, 9.0, 4.0, 8.0, 5.0, 5.0, 1.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0002791881561279297, -0.0002708137035369873, -0.0002624392509460449, -0.00025406479835510254, -0.00024569034576416016, -0.00023731589317321777, -0.0002289414405822754, -0.000220566987991333, -0.00021219253540039062, -0.00020381808280944824, -0.00019544363021850586, -0.00018706917762756348, -0.0001786947250366211, -0.0001703202724456787, -0.00016194581985473633, -0.00015357136726379395, -0.00014519691467285156, -0.00013682246208190918, -0.0001284480094909668, -0.00012007355690002441, -0.00011169910430908203, -0.00010332465171813965, -9.495019912719727e-05, -8.657574653625488e-05, -7.82012939453125e-05, -6.982684135437012e-05, -6.145238876342773e-05, -5.307793617248535e-05, -4.470348358154297e-05, -3.6329030990600586e-05, -2.7954578399658203e-05, -1.958012580871582e-05, -1.1205673217773438e-05, -2.8312206268310547e-06, 5.543231964111328e-06, 1.3917684555053711e-05, 2.2292137145996094e-05, 3.0666589736938477e-05, 3.904104232788086e-05, 4.741549491882324e-05, 5.5789947509765625e-05, 6.416440010070801e-05, 7.253885269165039e-05, 8.091330528259277e-05, 8.928775787353516e-05, 9.766221046447754e-05, 0.00010603666305541992, 0.0001144111156463623, 0.0001227855682373047, 0.00013116002082824707, 0.00013953447341918945, 0.00014790892601013184, 0.00015628337860107422, 0.0001646578311920166, 0.00017303228378295898, 0.00018140673637390137, 0.00018978118896484375, 0.00019815564155578613, 0.00020653009414672852, 0.0002149045467376709, 0.00022327899932861328, 0.00023165345191955566, 0.00024002790451049805, 0.00024840235710144043, 0.0002567768096923828]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 5.0, 7.0, 5.0, 11.0, 18.0, 13.0, 26.0, 30.0, 42.0, 41.0, 62.0, 73.0, 145.0, 236.0, 400.0, 806.0, 5103.0, 996327.0, 42811.0, 1104.0, 461.0, 233.0, 162.0, 103.0, 79.0, 54.0, 41.0, 26.0, 16.0, 26.0, 12.0, 9.0, 9.0, 10.0, 13.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00519561767578125, -0.0050261616706848145, -0.004856705665588379, -0.004687249660491943, -0.004517793655395508, -0.004348337650299072, -0.004178881645202637, -0.004009425640106201, -0.0038399696350097656, -0.00367051362991333, -0.0035010576248168945, -0.003331601619720459, -0.0031621456146240234, -0.002992689609527588, -0.0028232336044311523, -0.002653777599334717, -0.0024843215942382812, -0.0023148655891418457, -0.00214540958404541, -0.0019759535789489746, -0.001806497573852539, -0.0016370415687561035, -0.001467585563659668, -0.0012981295585632324, -0.0011286735534667969, -0.0009592175483703613, -0.0007897615432739258, -0.0006203055381774902, -0.0004508495330810547, -0.00028139352798461914, -0.0001119375228881836, 5.751848220825195e-05, 0.0002269744873046875, 0.00039643049240112305, 0.0005658864974975586, 0.0007353425025939941, 0.0009047985076904297, 0.0010742545127868652, 0.0012437105178833008, 0.0014131665229797363, 0.0015826225280761719, 0.0017520785331726074, 0.001921534538269043, 0.0020909905433654785, 0.002260446548461914, 0.0024299025535583496, 0.002599358558654785, 0.0027688145637512207, 0.0029382705688476562, 0.003107726573944092, 0.0032771825790405273, 0.003446638584136963, 0.0036160945892333984, 0.003785550594329834, 0.0039550065994262695, 0.004124462604522705, 0.004293918609619141, 0.004463374614715576, 0.004632830619812012, 0.004802286624908447, 0.004971742630004883, 0.005141198635101318, 0.005310654640197754, 0.0054801106452941895, 0.005649566650390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 11.0, 62.0, 204.0, 405.0, 253.0, 63.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009686995763331652, -0.0009487346396781504, -0.0009287697612307966, -0.0009088048245757818, -0.0008888398879207671, -0.0008688750094734132, -0.0008489100728183985, -0.0008289451943710446, -0.0008089802577160299, -0.0007890153210610151, -0.0007690504426136613, -0.0007490855059586465, -0.0007291205693036318, -0.0007091556908562779, -0.0006891907542012632, -0.0006692258175462484, -0.0006492609390988946, -0.0006292960024438798, -0.000609331123996526, -0.0005893661873415112, -0.0005694012506864965, -0.0005494363722391427, -0.0005294714355841279, -0.0005095065571367741, -0.0004895415622740984, -0.0004695766547229141, -0.00044961171806789935, -0.00042964681051671505, -0.00040968190296553075, -0.00038971699541434646, -0.0003697520587593317, -0.0003497871512081474, -0.0003298222436569631, -0.0003098573361057788, -0.00028989239945076406, -0.00026992749189957976, -0.00024996258434839547, -0.00022999766224529594, -0.00021003274014219642, -0.00019006783259101212, -0.0001701029104879126, -0.00015013798838481307, -0.00013017308083362877, -0.00011020815873052925, -9.024324390338734e-05, -7.027832907624543e-05, -5.03134069731459e-05, -3.0348499421961606e-05, -1.038357731886208e-05, 9.581339327269234e-06, 2.9546255973400548e-05, 4.9511174438521266e-05, 6.947608926566318e-05, 8.944100409280509e-05, 0.00010940592619590461, 0.0001293708337470889, 0.00014933575585018843, 0.00016930067795328796, 0.00018926558550447226, 0.00020923050760757178, 0.0002291954297106713, 0.0002491603372618556, 0.00026912527391687036, 0.0002890901523642242, 0.00030905508901923895]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 8.0, 9.0, 12.0, 10.0, 7.0, 13.0, 12.0, 24.0, 22.0, 21.0, 29.0, 40.0, 27.0, 37.0, 35.0, 49.0, 37.0, 38.0, 57.0, 39.0, 47.0, 43.0, 51.0, 38.0, 35.0, 30.0, 23.0, 27.0, 31.0, 25.0, 22.0, 17.0, 17.0, 12.0, 15.0, 6.0, 10.0, 5.0, 8.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015354156494140625, -0.00014870613813400269, -0.00014387071132659912, -0.00013903528451919556, -0.000134199857711792, -0.00012936443090438843, -0.00012452900409698486, -0.0001196935772895813, -0.00011485815048217773, -0.00011002272367477417, -0.0001051872968673706, -0.00010035187005996704, -9.551644325256348e-05, -9.068101644515991e-05, -8.584558963775635e-05, -8.101016283035278e-05, -7.617473602294922e-05, -7.133930921554565e-05, -6.650388240814209e-05, -6.166845560073853e-05, -5.683302879333496e-05, -5.1997601985931396e-05, -4.716217517852783e-05, -4.232674837112427e-05, -3.74913215637207e-05, -3.265589475631714e-05, -2.7820467948913574e-05, -2.298504114151001e-05, -1.8149614334106445e-05, -1.3314187526702881e-05, -8.478760719299316e-06, -3.643333911895752e-06, 1.1920928955078125e-06, 6.027519702911377e-06, 1.0862946510314941e-05, 1.5698373317718506e-05, 2.053380012512207e-05, 2.5369226932525635e-05, 3.02046537399292e-05, 3.5040080547332764e-05, 3.987550735473633e-05, 4.471093416213989e-05, 4.954636096954346e-05, 5.438178777694702e-05, 5.9217214584350586e-05, 6.405264139175415e-05, 6.888806819915771e-05, 7.372349500656128e-05, 7.855892181396484e-05, 8.339434862136841e-05, 8.822977542877197e-05, 9.306520223617554e-05, 9.79006290435791e-05, 0.00010273605585098267, 0.00010757148265838623, 0.0001124069094657898, 0.00011724233627319336, 0.00012207776308059692, 0.0001269131898880005, 0.00013174861669540405, 0.00013658404350280762, 0.00014141947031021118, 0.00014625489711761475, 0.0001510903239250183, 0.00015592575073242188]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 9.0, 5.0, 15.0, 13.0, 15.0, 14.0, 20.0, 16.0, 18.0, 20.0, 21.0, 29.0, 23.0, 30.0, 30.0, 36.0, 41.0, 44.0, 52.0, 41.0, 44.0, 40.0, 39.0, 36.0, 35.0, 33.0, 32.0, 38.0, 23.0, 20.0, 24.0, 25.0, 12.0, 10.0, 13.0, 13.0, 7.0, 12.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.42578125, -2.35235595703125, -2.2789306640625, -2.20550537109375, -2.132080078125, -2.05865478515625, -1.9852294921875, -1.91180419921875, -1.83837890625, -1.76495361328125, -1.6915283203125, -1.61810302734375, -1.544677734375, -1.47125244140625, -1.3978271484375, -1.32440185546875, -1.2509765625, -1.17755126953125, -1.1041259765625, -1.03070068359375, -0.957275390625, -0.88385009765625, -0.8104248046875, -0.73699951171875, -0.66357421875, -0.59014892578125, -0.5167236328125, -0.44329833984375, -0.369873046875, -0.29644775390625, -0.2230224609375, -0.14959716796875, -0.076171875, -0.00274658203125, 0.0706787109375, 0.14410400390625, 0.217529296875, 0.29095458984375, 0.3643798828125, 0.43780517578125, 0.51123046875, 0.58465576171875, 0.6580810546875, 0.73150634765625, 0.804931640625, 0.87835693359375, 0.9517822265625, 1.02520751953125, 1.0986328125, 1.17205810546875, 1.2454833984375, 1.31890869140625, 1.392333984375, 1.46575927734375, 1.5391845703125, 1.61260986328125, 1.68603515625, 1.75946044921875, 1.8328857421875, 1.90631103515625, 1.979736328125, 2.05316162109375, 2.1265869140625, 2.20001220703125, 2.2734375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 11.0, 19.0, 30.0, 35.0, 49.0, 71.0, 114.0, 140.0, 237.0, 321.0, 538.0, 1039.0, 2322.0, 6001.0, 16627.0, 44756.0, 114712.0, 287360.0, 343159.0, 140792.0, 55805.0, 21025.0, 7433.0, 2930.0, 1191.0, 658.0, 403.0, 247.0, 155.0, 112.0, 71.0, 57.0, 36.0, 34.0, 13.0, 12.0, 12.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.326171875, -3.228668212890625, -3.13116455078125, -3.033660888671875, -2.9361572265625, -2.838653564453125, -2.74114990234375, -2.643646240234375, -2.546142578125, -2.448638916015625, -2.35113525390625, -2.253631591796875, -2.1561279296875, -2.058624267578125, -1.96112060546875, -1.863616943359375, -1.76611328125, -1.668609619140625, -1.57110595703125, -1.473602294921875, -1.3760986328125, -1.278594970703125, -1.18109130859375, -1.083587646484375, -0.986083984375, -0.888580322265625, -0.79107666015625, -0.693572998046875, -0.5960693359375, -0.498565673828125, -0.40106201171875, -0.303558349609375, -0.2060546875, -0.108551025390625, -0.01104736328125, 0.086456298828125, 0.1839599609375, 0.281463623046875, 0.37896728515625, 0.476470947265625, 0.573974609375, 0.671478271484375, 0.76898193359375, 0.866485595703125, 0.9639892578125, 1.061492919921875, 1.15899658203125, 1.256500244140625, 1.35400390625, 1.451507568359375, 1.54901123046875, 1.646514892578125, 1.7440185546875, 1.841522216796875, 1.93902587890625, 2.036529541015625, 2.134033203125, 2.231536865234375, 2.32904052734375, 2.426544189453125, 2.5240478515625, 2.621551513671875, 2.71905517578125, 2.816558837890625, 2.9140625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 7.0, 10.0, 10.0, 15.0, 15.0, 14.0, 26.0, 22.0, 33.0, 24.0, 44.0, 33.0, 43.0, 49.0, 85.0, 125.0, 335.0, 1451.0, 185.0, 93.0, 72.0, 45.0, 33.0, 43.0, 31.0, 36.0, 20.0, 33.0, 23.0, 20.0, 13.0, 11.0, 19.0, 5.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.5513916015625, -7.251220703125, -6.9510498046875, -6.65087890625, -6.3507080078125, -6.050537109375, -5.7503662109375, -5.4501953125, -5.1500244140625, -4.849853515625, -4.5496826171875, -4.24951171875, -3.9493408203125, -3.649169921875, -3.3489990234375, -3.048828125, -2.7486572265625, -2.448486328125, -2.1483154296875, -1.84814453125, -1.5479736328125, -1.247802734375, -0.9476318359375, -0.6474609375, -0.3472900390625, -0.047119140625, 0.2530517578125, 0.55322265625, 0.8533935546875, 1.153564453125, 1.4537353515625, 1.75390625, 2.0540771484375, 2.354248046875, 2.6544189453125, 2.95458984375, 3.2547607421875, 3.554931640625, 3.8551025390625, 4.1552734375, 4.4554443359375, 4.755615234375, 5.0557861328125, 5.35595703125, 5.6561279296875, 5.956298828125, 6.2564697265625, 6.556640625, 6.8568115234375, 7.156982421875, 7.4571533203125, 7.75732421875, 8.0574951171875, 8.357666015625, 8.6578369140625, 8.9580078125, 9.2581787109375, 9.558349609375, 9.8585205078125, 10.15869140625, 10.4588623046875, 10.759033203125, 11.0592041015625, 11.359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 6.0, 13.0, 10.0, 17.0, 22.0, 33.0, 31.0, 40.0, 59.0, 76.0, 115.0, 168.0, 232.0, 413.0, 1152.0, 49961.0, 3085490.0, 6176.0, 680.0, 318.0, 188.0, 115.0, 88.0, 65.0, 59.0, 46.0, 25.0, 16.0, 11.0, 12.0, 8.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.057373046875, -25.06787109375, -24.078369140625, -23.0888671875, -22.099365234375, -21.10986328125, -20.120361328125, -19.130859375, -18.141357421875, -17.15185546875, -16.162353515625, -15.1728515625, -14.183349609375, -13.19384765625, -12.204345703125, -11.21484375, -10.225341796875, -9.23583984375, -8.246337890625, -7.2568359375, -6.267333984375, -5.27783203125, -4.288330078125, -3.298828125, -2.309326171875, -1.31982421875, -0.330322265625, 0.6591796875, 1.648681640625, 2.63818359375, 3.627685546875, 4.6171875, 5.606689453125, 6.59619140625, 7.585693359375, 8.5751953125, 9.564697265625, 10.55419921875, 11.543701171875, 12.533203125, 13.522705078125, 14.51220703125, 15.501708984375, 16.4912109375, 17.480712890625, 18.47021484375, 19.459716796875, 20.44921875, 21.438720703125, 22.42822265625, 23.417724609375, 24.4072265625, 25.396728515625, 26.38623046875, 27.375732421875, 28.365234375, 29.354736328125, 30.34423828125, 31.333740234375, 32.3232421875, 33.312744140625, 34.30224609375, 35.291748046875, 36.28125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 7.0, 260.0, 724.0, 27.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.614267349243164, -20.674463272094727, -16.73465919494629, -12.794856071472168, -8.85505199432373, -4.915248870849609, -0.9754447937011719, 2.9643592834472656, 6.904163360595703, 10.84396743774414, 14.783771514892578, 18.723575592041016, 22.663379669189453, 26.603181838989258, 30.542985916137695, 34.4827880859375, 38.42259216308594, 42.362396240234375, 46.30220031738281, 50.24200439453125, 54.18180847167969, 58.121612548828125, 62.06141662597656, 66.001220703125, 69.94102478027344, 73.88082885742188, 77.82063293457031, 81.76043701171875, 85.70024108886719, 89.64004516601562, 93.57984924316406, 97.5196533203125, 101.4594497680664, 105.39925384521484, 109.33905792236328, 113.27886199951172, 117.21866607666016, 121.1584701538086, 125.09827423095703, 129.03807067871094, 132.97787475585938, 136.9176788330078, 140.85748291015625, 144.7972869873047, 148.73709106445312, 152.67689514160156, 156.61669921875, 160.55650329589844, 164.49630737304688, 168.4361114501953, 172.37591552734375, 176.3157196044922, 180.25552368164062, 184.19532775878906, 188.1351318359375, 192.07493591308594, 196.01473999023438, 199.9545440673828, 203.89434814453125, 207.8341522216797, 211.77395629882812, 215.71376037597656, 219.653564453125, 223.59336853027344, 227.53317260742188]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 9.0, 12.0, 6.0, 7.0, 7.0, 15.0, 10.0, 18.0, 18.0, 22.0, 25.0, 35.0, 33.0, 24.0, 30.0, 40.0, 36.0, 38.0, 40.0, 44.0, 46.0, 35.0, 45.0, 43.0, 32.0, 29.0, 31.0, 34.0, 24.0, 31.0, 33.0, 25.0, 20.0, 21.0, 19.0, 13.0, 8.0, 8.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-29.23430061340332, -28.441085815429688, -27.647872924804688, -26.854658126831055, -26.061443328857422, -25.268230438232422, -24.47501564025879, -23.681800842285156, -22.888587951660156, -22.095373153686523, -21.302160263061523, -20.50894546508789, -19.715730667114258, -18.922515869140625, -18.129302978515625, -17.336088180541992, -16.54287338256836, -15.749659538269043, -14.95644474029541, -14.163230895996094, -13.370016098022461, -12.576802253723145, -11.783588409423828, -10.990373611450195, -10.197159767150879, -9.403945922851562, -8.61073112487793, -7.817517280578613, -7.024302959442139, -6.231088638305664, -5.437874794006348, -4.644660472869873, -3.8514480590820312, -3.0582337379455566, -2.265019655227661, -1.4718055725097656, -0.678591251373291, 0.1146230697631836, 0.9078369140625, 1.7010512351989746, 2.494265556335449, 3.287479877471924, 4.080694198608398, 4.873908042907715, 5.6671223640441895, 6.460336685180664, 7.2535505294799805, 8.046764373779297, 8.83997917175293, 9.633193016052246, 10.426407814025879, 11.219621658325195, 12.012836456298828, 12.806050300598145, 13.599264144897461, 14.392478942871094, 15.18569278717041, 15.978906631469727, 16.77212142944336, 17.56533432006836, 18.358549118041992, 19.151763916015625, 19.944976806640625, 20.738191604614258, 21.53140640258789]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 7.0, 5.0, 5.0, 11.0, 18.0, 12.0, 13.0, 15.0, 19.0, 22.0, 24.0, 26.0, 41.0, 28.0, 31.0, 46.0, 38.0, 41.0, 46.0, 48.0, 50.0, 37.0, 35.0, 46.0, 38.0, 44.0, 29.0, 24.0, 29.0, 32.0, 18.0, 14.0, 22.0, 8.0, 10.0, 14.0, 11.0, 5.0, 9.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.904296875, -2.813507080078125, -2.72271728515625, -2.631927490234375, -2.5411376953125, -2.450347900390625, -2.35955810546875, -2.268768310546875, -2.177978515625, -2.087188720703125, -1.99639892578125, -1.905609130859375, -1.8148193359375, -1.724029541015625, -1.63323974609375, -1.542449951171875, -1.45166015625, -1.360870361328125, -1.27008056640625, -1.179290771484375, -1.0885009765625, -0.997711181640625, -0.90692138671875, -0.816131591796875, -0.725341796875, -0.634552001953125, -0.54376220703125, -0.452972412109375, -0.3621826171875, -0.271392822265625, -0.18060302734375, -0.089813232421875, 0.0009765625, 0.091766357421875, 0.18255615234375, 0.273345947265625, 0.3641357421875, 0.454925537109375, 0.54571533203125, 0.636505126953125, 0.727294921875, 0.818084716796875, 0.90887451171875, 0.999664306640625, 1.0904541015625, 1.181243896484375, 1.27203369140625, 1.362823486328125, 1.45361328125, 1.544403076171875, 1.63519287109375, 1.725982666015625, 1.8167724609375, 1.907562255859375, 1.99835205078125, 2.089141845703125, 2.179931640625, 2.270721435546875, 2.36151123046875, 2.452301025390625, 2.5430908203125, 2.633880615234375, 2.72467041015625, 2.815460205078125, 2.90625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 10.0, 9.0, 15.0, 11.0, 18.0, 14.0, 14.0, 20.0, 19.0, 39.0, 45.0, 43.0, 65.0, 139.0, 293.0, 850.0, 4361.0, 120869.0, 2561323.0, 1463866.0, 38001.0, 2667.0, 786.0, 279.0, 162.0, 80.0, 51.0, 38.0, 22.0, 19.0, 27.0, 19.0, 10.0, 14.0, 5.0, 10.0, 9.0, 10.0, 8.0, 12.0, 0.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.609375, -9.31689453125, -9.0244140625, -8.73193359375, -8.439453125, -8.14697265625, -7.8544921875, -7.56201171875, -7.26953125, -6.97705078125, -6.6845703125, -6.39208984375, -6.099609375, -5.80712890625, -5.5146484375, -5.22216796875, -4.9296875, -4.63720703125, -4.3447265625, -4.05224609375, -3.759765625, -3.46728515625, -3.1748046875, -2.88232421875, -2.58984375, -2.29736328125, -2.0048828125, -1.71240234375, -1.419921875, -1.12744140625, -0.8349609375, -0.54248046875, -0.25, 0.04248046875, 0.3349609375, 0.62744140625, 0.919921875, 1.21240234375, 1.5048828125, 1.79736328125, 2.08984375, 2.38232421875, 2.6748046875, 2.96728515625, 3.259765625, 3.55224609375, 3.8447265625, 4.13720703125, 4.4296875, 4.72216796875, 5.0146484375, 5.30712890625, 5.599609375, 5.89208984375, 6.1845703125, 6.47705078125, 6.76953125, 7.06201171875, 7.3544921875, 7.64697265625, 7.939453125, 8.23193359375, 8.5244140625, 8.81689453125, 9.109375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 14.0, 17.0, 16.0, 22.0, 38.0, 51.0, 60.0, 91.0, 110.0, 174.0, 222.0, 274.0, 322.0, 370.0, 399.0, 384.0, 356.0, 275.0, 202.0, 159.0, 123.0, 109.0, 67.0, 48.0, 50.0, 30.0, 23.0, 14.0, 11.0, 5.0, 8.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.71875, -5.5430908203125, -5.367431640625, -5.1917724609375, -5.01611328125, -4.8404541015625, -4.664794921875, -4.4891357421875, -4.3134765625, -4.1378173828125, -3.962158203125, -3.7864990234375, -3.61083984375, -3.4351806640625, -3.259521484375, -3.0838623046875, -2.908203125, -2.7325439453125, -2.556884765625, -2.3812255859375, -2.20556640625, -2.0299072265625, -1.854248046875, -1.6785888671875, -1.5029296875, -1.3272705078125, -1.151611328125, -0.9759521484375, -0.80029296875, -0.6246337890625, -0.448974609375, -0.2733154296875, -0.09765625, 0.0780029296875, 0.253662109375, 0.4293212890625, 0.60498046875, 0.7806396484375, 0.956298828125, 1.1319580078125, 1.3076171875, 1.4832763671875, 1.658935546875, 1.8345947265625, 2.01025390625, 2.1859130859375, 2.361572265625, 2.5372314453125, 2.712890625, 2.8885498046875, 3.064208984375, 3.2398681640625, 3.41552734375, 3.5911865234375, 3.766845703125, 3.9425048828125, 4.1181640625, 4.2938232421875, 4.469482421875, 4.6451416015625, 4.82080078125, 4.9964599609375, 5.172119140625, 5.3477783203125, 5.5234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 8.0, 9.0, 9.0, 17.0, 16.0, 31.0, 49.0, 62.0, 91.0, 106.0, 182.0, 214.0, 285.0, 504.0, 1217.0, 25683.0, 3447004.0, 712177.0, 4573.0, 729.0, 388.0, 264.0, 190.0, 125.0, 99.0, 70.0, 49.0, 35.0, 25.0, 22.0, 13.0, 14.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.405029296875, -16.77880859375, -16.152587890625, -15.5263671875, -14.900146484375, -14.27392578125, -13.647705078125, -13.021484375, -12.395263671875, -11.76904296875, -11.142822265625, -10.5166015625, -9.890380859375, -9.26416015625, -8.637939453125, -8.01171875, -7.385498046875, -6.75927734375, -6.133056640625, -5.5068359375, -4.880615234375, -4.25439453125, -3.628173828125, -3.001953125, -2.375732421875, -1.74951171875, -1.123291015625, -0.4970703125, 0.129150390625, 0.75537109375, 1.381591796875, 2.0078125, 2.634033203125, 3.26025390625, 3.886474609375, 4.5126953125, 5.138916015625, 5.76513671875, 6.391357421875, 7.017578125, 7.643798828125, 8.27001953125, 8.896240234375, 9.5224609375, 10.148681640625, 10.77490234375, 11.401123046875, 12.02734375, 12.653564453125, 13.27978515625, 13.906005859375, 14.5322265625, 15.158447265625, 15.78466796875, 16.410888671875, 17.037109375, 17.663330078125, 18.28955078125, 18.915771484375, 19.5419921875, 20.168212890625, 20.79443359375, 21.420654296875, 22.046875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 56.0, 244.0, 411.0, 238.0, 54.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.37199401855469, -96.48629760742188, -93.60060119628906, -90.71491241455078, -87.82921600341797, -84.94351959228516, -82.05783081054688, -79.17213439941406, -76.28643798828125, -73.40074157714844, -70.51504516601562, -67.62935638427734, -64.74365997314453, -61.85796356201172, -58.97227096557617, -56.086578369140625, -53.20088195800781, -50.315185546875, -47.42949295043945, -44.543800354003906, -41.658103942871094, -38.77240753173828, -35.886714935302734, -33.00102233886719, -30.115325927734375, -27.229631423950195, -24.343936920166016, -21.458242416381836, -18.572547912597656, -15.686853408813477, -12.801158905029297, -9.915464401245117, -7.0297698974609375, -4.144075393676758, -1.2583808898925781, 1.6273136138916016, 4.513008117675781, 7.398702621459961, 10.28439712524414, 13.17009162902832, 16.0557861328125, 18.94148063659668, 21.82717514038086, 24.71286964416504, 27.59856414794922, 30.4842586517334, 33.36995315551758, 36.255645751953125, 39.14134216308594, 42.02703857421875, 44.9127311706543, 47.798423767089844, 50.684120178222656, 53.56981658935547, 56.455509185791016, 59.34120178222656, 62.226898193359375, 65.11259460449219, 67.998291015625, 70.88397979736328, 73.7696762084961, 76.6553726196289, 79.54106140136719, 82.4267578125, 85.31245422363281]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 10.0, 13.0, 14.0, 17.0, 21.0, 16.0, 22.0, 24.0, 31.0, 39.0, 41.0, 40.0, 38.0, 35.0, 43.0, 49.0, 41.0, 44.0, 52.0, 49.0, 35.0, 46.0, 31.0, 34.0, 35.0, 30.0, 24.0, 18.0, 15.0, 12.0, 7.0, 11.0, 11.0, 5.0, 12.0, 10.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.26325225830078, -18.639440536499023, -18.015626907348633, -17.391815185546875, -16.768003463745117, -16.14419174194336, -15.520378112792969, -14.896566390991211, -14.272753715515137, -13.648941040039062, -13.025129318237305, -12.40131664276123, -11.777503967285156, -11.153692245483398, -10.529879570007324, -9.90606689453125, -9.282255172729492, -8.658442497253418, -8.03463077545166, -7.410818099975586, -6.78700590133667, -6.163193702697754, -5.53938102722168, -4.915568828582764, -4.291756629943848, -3.6679444313049316, -3.0441319942474365, -2.4203195571899414, -1.7965073585510254, -1.1726951599121094, -0.5488827228546143, 0.07492971420288086, 0.6987419128417969, 1.3225542306900024, 1.946366548538208, 2.570178985595703, 3.193991184234619, 3.817803382873535, 4.441616058349609, 5.065428256988525, 5.689240455627441, 6.313052654266357, 6.936864852905273, 7.560677528381348, 8.184490203857422, 8.80830192565918, 9.432114601135254, 10.055927276611328, 10.679738998413086, 11.30355167388916, 11.927363395690918, 12.551176071166992, 13.17498779296875, 13.798800468444824, 14.422613143920898, 15.046424865722656, 15.67023754119873, 16.294050216674805, 16.917861938476562, 17.54167366027832, 18.16548728942871, 18.78929901123047, 19.413110733032227, 20.036924362182617, 20.660736083984375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 15.0, 22.0, 15.0, 25.0, 22.0, 34.0, 35.0, 29.0, 35.0, 37.0, 41.0, 43.0, 49.0, 42.0, 51.0, 39.0, 52.0, 37.0, 43.0, 42.0, 36.0, 29.0, 33.0, 24.0, 18.0, 32.0, 21.0, 14.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.019744873046875, -2.92620849609375, -2.832672119140625, -2.7391357421875, -2.645599365234375, -2.55206298828125, -2.458526611328125, -2.364990234375, -2.271453857421875, -2.17791748046875, -2.084381103515625, -1.9908447265625, -1.897308349609375, -1.80377197265625, -1.710235595703125, -1.61669921875, -1.523162841796875, -1.42962646484375, -1.336090087890625, -1.2425537109375, -1.149017333984375, -1.05548095703125, -0.961944580078125, -0.868408203125, -0.774871826171875, -0.68133544921875, -0.587799072265625, -0.4942626953125, -0.400726318359375, -0.30718994140625, -0.213653564453125, -0.1201171875, -0.026580810546875, 0.06695556640625, 0.160491943359375, 0.2540283203125, 0.347564697265625, 0.44110107421875, 0.534637451171875, 0.628173828125, 0.721710205078125, 0.81524658203125, 0.908782958984375, 1.0023193359375, 1.095855712890625, 1.18939208984375, 1.282928466796875, 1.37646484375, 1.470001220703125, 1.56353759765625, 1.657073974609375, 1.7506103515625, 1.844146728515625, 1.93768310546875, 2.031219482421875, 2.124755859375, 2.218292236328125, 2.31182861328125, 2.405364990234375, 2.4989013671875, 2.592437744140625, 2.68597412109375, 2.779510498046875, 2.873046875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 10.0, 10.0, 14.0, 13.0, 22.0, 36.0, 37.0, 63.0, 102.0, 127.0, 211.0, 299.0, 462.0, 780.0, 1129.0, 1866.0, 2919.0, 4876.0, 7488.0, 12303.0, 19930.0, 32437.0, 54822.0, 103209.0, 232474.0, 289340.0, 123512.0, 63711.0, 36927.0, 22611.0, 13801.0, 8593.0, 5287.0, 3303.0, 2123.0, 1243.0, 850.0, 561.0, 340.0, 247.0, 163.0, 104.0, 68.0, 51.0, 28.0, 25.0, 10.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.52197265625, -0.5046463012695312, -0.4873199462890625, -0.46999359130859375, -0.452667236328125, -0.43534088134765625, -0.4180145263671875, -0.40068817138671875, -0.38336181640625, -0.36603546142578125, -0.3487091064453125, -0.33138275146484375, -0.314056396484375, -0.29673004150390625, -0.2794036865234375, -0.26207733154296875, -0.2447509765625, -0.22742462158203125, -0.2100982666015625, -0.19277191162109375, -0.175445556640625, -0.15811920166015625, -0.1407928466796875, -0.12346649169921875, -0.10614013671875, -0.08881378173828125, -0.0714874267578125, -0.05416107177734375, -0.036834716796875, -0.01950836181640625, -0.0021820068359375, 0.01514434814453125, 0.032470703125, 0.04979705810546875, 0.0671234130859375, 0.08444976806640625, 0.101776123046875, 0.11910247802734375, 0.1364288330078125, 0.15375518798828125, 0.17108154296875, 0.18840789794921875, 0.2057342529296875, 0.22306060791015625, 0.240386962890625, 0.25771331787109375, 0.2750396728515625, 0.29236602783203125, 0.3096923828125, 0.32701873779296875, 0.3443450927734375, 0.36167144775390625, 0.378997802734375, 0.39632415771484375, 0.4136505126953125, 0.43097686767578125, 0.44830322265625, 0.46562957763671875, 0.4829559326171875, 0.5002822875976562, 0.517608642578125, 0.5349349975585938, 0.5522613525390625, 0.5695877075195312, 0.5869140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 2.0, 6.0, 5.0, 7.0, 12.0, 6.0, 15.0, 14.0, 10.0, 17.0, 18.0, 30.0, 23.0, 27.0, 34.0, 28.0, 27.0, 32.0, 31.0, 35.0, 48.0, 47.0, 1057.0, 38.0, 38.0, 37.0, 42.0, 33.0, 37.0, 31.0, 31.0, 30.0, 29.0, 25.0, 24.0, 20.0, 14.0, 21.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.5855865478515625, -1.530548095703125, -1.4755096435546875, -1.42047119140625, -1.3654327392578125, -1.310394287109375, -1.2553558349609375, -1.2003173828125, -1.1452789306640625, -1.090240478515625, -1.0352020263671875, -0.98016357421875, -0.9251251220703125, -0.870086669921875, -0.8150482177734375, -0.760009765625, -0.7049713134765625, -0.649932861328125, -0.5948944091796875, -0.53985595703125, -0.4848175048828125, -0.429779052734375, -0.3747406005859375, -0.3197021484375, -0.2646636962890625, -0.209625244140625, -0.1545867919921875, -0.09954833984375, -0.0445098876953125, 0.010528564453125, 0.0655670166015625, 0.12060546875, 0.1756439208984375, 0.230682373046875, 0.2857208251953125, 0.34075927734375, 0.3957977294921875, 0.450836181640625, 0.5058746337890625, 0.5609130859375, 0.6159515380859375, 0.670989990234375, 0.7260284423828125, 0.78106689453125, 0.8361053466796875, 0.891143798828125, 0.9461822509765625, 1.001220703125, 1.0562591552734375, 1.111297607421875, 1.1663360595703125, 1.22137451171875, 1.2764129638671875, 1.331451416015625, 1.3864898681640625, 1.4415283203125, 1.4965667724609375, 1.551605224609375, 1.6066436767578125, 1.66168212890625, 1.7167205810546875, 1.771759033203125, 1.8267974853515625, 1.8818359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 5.0, 12.0, 8.0, 25.0, 27.0, 44.0, 81.0, 99.0, 163.0, 196.0, 357.0, 468.0, 726.0, 1051.0, 1483.0, 2226.0, 3194.0, 4941.0, 7389.0, 11353.0, 17699.0, 28251.0, 45215.0, 78062.0, 146501.0, 1337546.0, 178003.0, 90189.0, 52024.0, 31605.0, 19887.0, 12868.0, 8464.0, 5580.0, 3675.0, 2521.0, 1687.0, 1135.0, 776.0, 538.0, 326.0, 259.0, 162.0, 105.0, 83.0, 36.0, 33.0, 14.0, 15.0, 18.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43358612060546875, -0.4184417724609375, -0.40329742431640625, -0.388153076171875, -0.37300872802734375, -0.3578643798828125, -0.34272003173828125, -0.32757568359375, -0.31243133544921875, -0.2972869873046875, -0.28214263916015625, -0.266998291015625, -0.25185394287109375, -0.2367095947265625, -0.22156524658203125, -0.2064208984375, -0.19127655029296875, -0.1761322021484375, -0.16098785400390625, -0.145843505859375, -0.13069915771484375, -0.1155548095703125, -0.10041046142578125, -0.08526611328125, -0.07012176513671875, -0.0549774169921875, -0.03983306884765625, -0.024688720703125, -0.00954437255859375, 0.0055999755859375, 0.02074432373046875, 0.035888671875, 0.05103302001953125, 0.0661773681640625, 0.08132171630859375, 0.096466064453125, 0.11161041259765625, 0.1267547607421875, 0.14189910888671875, 0.15704345703125, 0.17218780517578125, 0.1873321533203125, 0.20247650146484375, 0.217620849609375, 0.23276519775390625, 0.2479095458984375, 0.26305389404296875, 0.2781982421875, 0.29334259033203125, 0.3084869384765625, 0.32363128662109375, 0.338775634765625, 0.35391998291015625, 0.3690643310546875, 0.38420867919921875, 0.39935302734375, 0.41449737548828125, 0.4296417236328125, 0.44478607177734375, 0.459930419921875, 0.47507476806640625, 0.4902191162109375, 0.5053634643554688, 0.5205078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 8.0, 11.0, 15.0, 17.0, 19.0, 25.0, 24.0, 48.0, 51.0, 40.0, 53.0, 59.0, 61.0, 69.0, 66.0, 65.0, 62.0, 48.0, 56.0, 38.0, 29.0, 24.0, 19.0, 14.0, 13.0, 15.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003540515899658203, -0.0003424994647502899, -0.0003309473395347595, -0.0003193952143192291, -0.00030784308910369873, -0.00029629096388816833, -0.00028473883867263794, -0.00027318671345710754, -0.00026163458824157715, -0.00025008246302604675, -0.00023853033781051636, -0.00022697821259498596, -0.00021542608737945557, -0.00020387396216392517, -0.00019232183694839478, -0.00018076971173286438, -0.00016921758651733398, -0.0001576654613018036, -0.0001461133360862732, -0.0001345612108707428, -0.0001230090856552124, -0.00011145696043968201, -9.990483522415161e-05, -8.835271000862122e-05, -7.680058479309082e-05, -6.524845957756042e-05, -5.369633436203003e-05, -4.2144209146499634e-05, -3.059208393096924e-05, -1.9039958715438843e-05, -7.487833499908447e-06, 4.064291715621948e-06, 1.5616416931152344e-05, 2.716854214668274e-05, 3.8720667362213135e-05, 5.027279257774353e-05, 6.182491779327393e-05, 7.337704300880432e-05, 8.492916822433472e-05, 9.648129343986511e-05, 0.00010803341865539551, 0.0001195855438709259, 0.0001311376690864563, 0.0001426897943019867, 0.0001542419195175171, 0.00016579404473304749, 0.00017734616994857788, 0.00018889829516410828, 0.00020045042037963867, 0.00021200254559516907, 0.00022355467081069946, 0.00023510679602622986, 0.00024665892124176025, 0.00025821104645729065, 0.00026976317167282104, 0.00028131529688835144, 0.00029286742210388184, 0.00030441954731941223, 0.0003159716725349426, 0.000327523797750473, 0.0003390759229660034, 0.0003506280481815338, 0.0003621801733970642, 0.0003737322986125946, 0.000385284423828125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 10.0, 7.0, 9.0, 16.0, 18.0, 21.0, 30.0, 29.0, 58.0, 67.0, 107.0, 155.0, 370.0, 863.0, 28850.0, 1014845.0, 1845.0, 527.0, 251.0, 123.0, 107.0, 61.0, 49.0, 30.0, 27.0, 26.0, 13.0, 8.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00848388671875, -0.008228898048400879, -0.007973909378051758, -0.007718920707702637, -0.007463932037353516, -0.0072089433670043945, -0.0069539546966552734, -0.006698966026306152, -0.006443977355957031, -0.00618898868560791, -0.005934000015258789, -0.005679011344909668, -0.005424022674560547, -0.005169034004211426, -0.004914045333862305, -0.004659056663513184, -0.0044040679931640625, -0.004149079322814941, -0.0038940906524658203, -0.0036391019821166992, -0.003384113311767578, -0.003129124641418457, -0.002874135971069336, -0.002619147300720215, -0.0023641586303710938, -0.0021091699600219727, -0.0018541812896728516, -0.0015991926193237305, -0.0013442039489746094, -0.0010892152786254883, -0.0008342266082763672, -0.0005792379379272461, -0.000324249267578125, -6.92605972290039e-05, 0.0001857280731201172, 0.0004407167434692383, 0.0006957054138183594, 0.0009506940841674805, 0.0012056827545166016, 0.0014606714248657227, 0.0017156600952148438, 0.001970648765563965, 0.002225637435913086, 0.002480626106262207, 0.002735614776611328, 0.0029906034469604492, 0.0032455921173095703, 0.0035005807876586914, 0.0037555694580078125, 0.004010558128356934, 0.004265546798706055, 0.004520535469055176, 0.004775524139404297, 0.005030512809753418, 0.005285501480102539, 0.00554049015045166, 0.005795478820800781, 0.006050467491149902, 0.0063054561614990234, 0.0065604448318481445, 0.006815433502197266, 0.007070422172546387, 0.007325410842895508, 0.007580399513244629, 0.00783538818359375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 59.0, 313.0, 479.0, 140.0, 13.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006493672262877226, -0.0006214406457729638, -0.0005935140652582049, -0.0005655874847434461, -0.0005376609042286873, -0.0005097342655062675, -0.0004818077140953392, -0.0004538811044767499, -0.00042595452396199107, -0.00039802794344723225, -0.0003701013629324734, -0.0003421747824177146, -0.0003142481727991253, -0.0002863215922843665, -0.00025839501176960766, -0.0002304684167029336, -0.00020254185074009, -0.0001746152702253312, -0.00014668867515865713, -0.00011876209464389831, -9.083550685318187e-05, -6.290891906246543e-05, -3.4982338547706604e-05, -7.05574348103255e-06, 2.0870837033726275e-05, 4.8797424824442714e-05, 7.672401261515915e-05, 0.00010465059312991798, 0.0001325771736446768, 0.00016050376871135086, 0.00018843034922610968, 0.00021635694429278374, 0.00024428352480754256, 0.0002722101053223014, 0.0003001366858370602, 0.00032806326635181904, 0.0003559898759704083, 0.00038391645648516715, 0.00041184303699992597, 0.00043976964661851525, 0.0004676962271332741, 0.0004956228076480329, 0.0005235493881627917, 0.0005514759686775506, 0.0005794025491923094, 0.0006073291879147291, 0.000635255710221827, 0.0006631823489442468, 0.0006911088712513447, 0.0007190354517661035, 0.0007469620322808623, 0.0007748886127956212, 0.00080281519331038, 0.0008307418320327997, 0.0008586683543398976, 0.0008865949930623174, 0.0009145215735770762, 0.000942448154091835, 0.0009703747346065938, 0.0009983013151213527, 0.0010262279538437724, 0.0010541544761508703, 0.00108208111487329, 0.001110007637180388, 0.0011379342759028077]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 1.0, 11.0, 8.0, 17.0, 11.0, 10.0, 16.0, 19.0, 18.0, 34.0, 27.0, 37.0, 46.0, 33.0, 28.0, 33.0, 32.0, 46.0, 49.0, 39.0, 43.0, 41.0, 57.0, 43.0, 40.0, 34.0, 26.0, 33.0, 25.0, 25.0, 27.0, 17.0, 9.0, 15.0, 19.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016677379608154297, -0.00016130134463310242, -0.00015582889318466187, -0.0001503564417362213, -0.00014488399028778076, -0.0001394115388393402, -0.00013393908739089966, -0.0001284666359424591, -0.00012299418449401855, -0.000117521733045578, -0.00011204928159713745, -0.0001065768301486969, -0.00010110437870025635, -9.56319272518158e-05, -9.015947580337524e-05, -8.468702435493469e-05, -7.921457290649414e-05, -7.374212145805359e-05, -6.826967000961304e-05, -6.279721856117249e-05, -5.7324767112731934e-05, -5.185231566429138e-05, -4.637986421585083e-05, -4.090741276741028e-05, -3.5434961318969727e-05, -2.9962509870529175e-05, -2.4490058422088623e-05, -1.901760697364807e-05, -1.354515552520752e-05, -8.072704076766968e-06, -2.600252628326416e-06, 2.8721988201141357e-06, 8.344650268554688e-06, 1.381710171699524e-05, 1.928955316543579e-05, 2.4762004613876343e-05, 3.0234456062316895e-05, 3.5706907510757446e-05, 4.1179358959198e-05, 4.665181040763855e-05, 5.21242618560791e-05, 5.759671330451965e-05, 6.30691647529602e-05, 6.854161620140076e-05, 7.401406764984131e-05, 7.948651909828186e-05, 8.495897054672241e-05, 9.043142199516296e-05, 9.590387344360352e-05, 0.00010137632489204407, 0.00010684877634048462, 0.00011232122778892517, 0.00011779367923736572, 0.00012326613068580627, 0.00012873858213424683, 0.00013421103358268738, 0.00013968348503112793, 0.00014515593647956848, 0.00015062838792800903, 0.00015610083937644958, 0.00016157329082489014, 0.0001670457422733307, 0.00017251819372177124, 0.0001779906451702118, 0.00018346309661865234]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 15.0, 22.0, 15.0, 25.0, 22.0, 34.0, 35.0, 29.0, 35.0, 37.0, 41.0, 43.0, 49.0, 42.0, 51.0, 39.0, 52.0, 37.0, 43.0, 42.0, 36.0, 29.0, 33.0, 24.0, 18.0, 32.0, 21.0, 14.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.019744873046875, -2.92620849609375, -2.832672119140625, -2.7391357421875, -2.645599365234375, -2.55206298828125, -2.458526611328125, -2.364990234375, -2.271453857421875, -2.17791748046875, -2.084381103515625, -1.9908447265625, -1.897308349609375, -1.80377197265625, -1.710235595703125, -1.61669921875, -1.523162841796875, -1.42962646484375, -1.336090087890625, -1.2425537109375, -1.149017333984375, -1.05548095703125, -0.961944580078125, -0.868408203125, -0.774871826171875, -0.68133544921875, -0.587799072265625, -0.4942626953125, -0.400726318359375, -0.30718994140625, -0.213653564453125, -0.1201171875, -0.026580810546875, 0.06695556640625, 0.160491943359375, 0.2540283203125, 0.347564697265625, 0.44110107421875, 0.534637451171875, 0.628173828125, 0.721710205078125, 0.81524658203125, 0.908782958984375, 1.0023193359375, 1.095855712890625, 1.18939208984375, 1.282928466796875, 1.37646484375, 1.470001220703125, 1.56353759765625, 1.657073974609375, 1.7506103515625, 1.844146728515625, 1.93768310546875, 2.031219482421875, 2.124755859375, 2.218292236328125, 2.31182861328125, 2.405364990234375, 2.4989013671875, 2.592437744140625, 2.68597412109375, 2.779510498046875, 2.873046875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 5.0, 9.0, 9.0, 19.0, 30.0, 36.0, 37.0, 83.0, 102.0, 153.0, 229.0, 356.0, 606.0, 1353.0, 3057.0, 7094.0, 18274.0, 50284.0, 139139.0, 355003.0, 293246.0, 112702.0, 40715.0, 14908.0, 5818.0, 2512.0, 1188.0, 601.0, 361.0, 184.0, 163.0, 76.0, 64.0, 27.0, 34.0, 16.0, 22.0, 7.0, 8.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.41015625, -3.306488037109375, -3.20281982421875, -3.099151611328125, -2.9954833984375, -2.891815185546875, -2.78814697265625, -2.684478759765625, -2.580810546875, -2.477142333984375, -2.37347412109375, -2.269805908203125, -2.1661376953125, -2.062469482421875, -1.95880126953125, -1.855133056640625, -1.75146484375, -1.647796630859375, -1.54412841796875, -1.440460205078125, -1.3367919921875, -1.233123779296875, -1.12945556640625, -1.025787353515625, -0.922119140625, -0.818450927734375, -0.71478271484375, -0.611114501953125, -0.5074462890625, -0.403778076171875, -0.30010986328125, -0.196441650390625, -0.0927734375, 0.010894775390625, 0.11456298828125, 0.218231201171875, 0.3218994140625, 0.425567626953125, 0.52923583984375, 0.632904052734375, 0.736572265625, 0.840240478515625, 0.94390869140625, 1.047576904296875, 1.1512451171875, 1.254913330078125, 1.35858154296875, 1.462249755859375, 1.56591796875, 1.669586181640625, 1.77325439453125, 1.876922607421875, 1.9805908203125, 2.084259033203125, 2.18792724609375, 2.291595458984375, 2.395263671875, 2.498931884765625, 2.60260009765625, 2.706268310546875, 2.8099365234375, 2.913604736328125, 3.01727294921875, 3.120941162109375, 3.224609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 15.0, 17.0, 25.0, 26.0, 23.0, 31.0, 23.0, 46.0, 52.0, 64.0, 70.0, 137.0, 263.0, 1521.0, 229.0, 93.0, 62.0, 53.0, 46.0, 32.0, 27.0, 31.0, 16.0, 27.0, 19.0, 17.0, 8.0, 6.0, 11.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -10.0521240234375, -9.697998046875, -9.3438720703125, -8.98974609375, -8.6356201171875, -8.281494140625, -7.9273681640625, -7.5732421875, -7.2191162109375, -6.864990234375, -6.5108642578125, -6.15673828125, -5.8026123046875, -5.448486328125, -5.0943603515625, -4.740234375, -4.3861083984375, -4.031982421875, -3.6778564453125, -3.32373046875, -2.9696044921875, -2.615478515625, -2.2613525390625, -1.9072265625, -1.5531005859375, -1.198974609375, -0.8448486328125, -0.49072265625, -0.1365966796875, 0.217529296875, 0.5716552734375, 0.92578125, 1.2799072265625, 1.634033203125, 1.9881591796875, 2.34228515625, 2.6964111328125, 3.050537109375, 3.4046630859375, 3.7587890625, 4.1129150390625, 4.467041015625, 4.8211669921875, 5.17529296875, 5.5294189453125, 5.883544921875, 6.2376708984375, 6.591796875, 6.9459228515625, 7.300048828125, 7.6541748046875, 8.00830078125, 8.3624267578125, 8.716552734375, 9.0706787109375, 9.4248046875, 9.7789306640625, 10.133056640625, 10.4871826171875, 10.84130859375, 11.1954345703125, 11.549560546875, 11.9036865234375, 12.2578125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 10.0, 3.0, 3.0, 12.0, 14.0, 15.0, 17.0, 21.0, 28.0, 36.0, 56.0, 59.0, 91.0, 151.0, 241.0, 417.0, 1152.0, 19126.0, 3115308.0, 6910.0, 903.0, 371.0, 220.0, 159.0, 104.0, 69.0, 41.0, 33.0, 21.0, 20.0, 15.0, 12.0, 11.0, 8.0, 7.0, 9.0, 6.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.0, -40.70361328125, -39.4072265625, -38.11083984375, -36.814453125, -35.51806640625, -34.2216796875, -32.92529296875, -31.62890625, -30.33251953125, -29.0361328125, -27.73974609375, -26.443359375, -25.14697265625, -23.8505859375, -22.55419921875, -21.2578125, -19.96142578125, -18.6650390625, -17.36865234375, -16.072265625, -14.77587890625, -13.4794921875, -12.18310546875, -10.88671875, -9.59033203125, -8.2939453125, -6.99755859375, -5.701171875, -4.40478515625, -3.1083984375, -1.81201171875, -0.515625, 0.78076171875, 2.0771484375, 3.37353515625, 4.669921875, 5.96630859375, 7.2626953125, 8.55908203125, 9.85546875, 11.15185546875, 12.4482421875, 13.74462890625, 15.041015625, 16.33740234375, 17.6337890625, 18.93017578125, 20.2265625, 21.52294921875, 22.8193359375, 24.11572265625, 25.412109375, 26.70849609375, 28.0048828125, 29.30126953125, 30.59765625, 31.89404296875, 33.1904296875, 34.48681640625, 35.783203125, 37.07958984375, 38.3759765625, 39.67236328125, 40.96875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 13.0, 41.0, 118.0, 208.0, 242.0, 190.0, 123.0, 48.0, 17.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.137881755828857, -6.310557842254639, -5.48323392868042, -4.655909538269043, -3.8285858631134033, -3.0012617111206055, -2.1739377975463867, -1.346613883972168, -0.5192899703979492, 0.3080340027809143, 1.1353579759597778, 1.9626820087432861, 2.790005922317505, 3.6173300743103027, 4.4446539878845215, 5.27197790145874, 6.099301815032959, 6.926625728607178, 7.7539496421813965, 8.581274032592773, 9.408597946166992, 10.235921859741211, 11.06324577331543, 11.890569686889648, 12.717893600463867, 13.545217514038086, 14.372541427612305, 15.199865341186523, 16.027189254760742, 16.85451316833496, 17.68183708190918, 18.5091609954834, 19.336484909057617, 20.163808822631836, 20.991132736206055, 21.818456649780273, 22.645780563354492, 23.47310447692871, 24.30042839050293, 25.12775230407715, 25.955076217651367, 26.782400131225586, 27.609724044799805, 28.437047958374023, 29.264371871948242, 30.09169578552246, 30.91901969909668, 31.7463436126709, 32.57366943359375, 33.40099334716797, 34.22831726074219, 35.055641174316406, 35.882965087890625, 36.710289001464844, 37.53761291503906, 38.36493682861328, 39.1922607421875, 40.01958465576172, 40.84690856933594, 41.674232482910156, 42.501556396484375, 43.328880310058594, 44.15620422363281, 44.98352813720703, 45.81085205078125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 5.0, 7.0, 8.0, 13.0, 13.0, 22.0, 15.0, 13.0, 19.0, 29.0, 21.0, 33.0, 43.0, 41.0, 36.0, 23.0, 45.0, 46.0, 34.0, 46.0, 44.0, 41.0, 46.0, 23.0, 39.0, 42.0, 32.0, 28.0, 20.0, 37.0, 17.0, 13.0, 28.0, 13.0, 8.0, 6.0, 10.0, 5.0, 8.0, 7.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-27.100921630859375, -26.310359954833984, -25.51979637145996, -24.72923469543457, -23.93867301940918, -23.148109436035156, -22.357547760009766, -21.566986083984375, -20.776424407958984, -19.985862731933594, -19.19529914855957, -18.40473747253418, -17.61417579650879, -16.823612213134766, -16.033050537109375, -15.242488861083984, -14.451925277709961, -13.661362648010254, -12.870800971984863, -12.080238342285156, -11.289676666259766, -10.499114036560059, -9.708551406860352, -8.917989730834961, -8.127427101135254, -7.336864948272705, -6.546302795410156, -5.755740165710449, -4.9651780128479, -4.174615859985352, -3.3840532302856445, -2.5934910774230957, -1.8029308319091797, -1.0123685598373413, -0.22180628776550293, 0.568756103515625, 1.3593182563781738, 2.1498804092407227, 2.9404430389404297, 3.7310051918029785, 4.521567344665527, 5.312129497528076, 6.102691650390625, 6.893254280090332, 7.683816432952881, 8.47437858581543, 9.264941215515137, 10.055503845214844, 10.846065521240234, 11.636628150939941, 12.427189826965332, 13.217752456665039, 14.00831413269043, 14.798876762390137, 15.589439392089844, 16.380001068115234, 17.170562744140625, 17.961124420166016, 18.75168800354004, 19.54224967956543, 20.33281135559082, 21.123374938964844, 21.913936614990234, 22.704498291015625, 23.49506187438965]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 7.0, 5.0, 6.0, 3.0, 12.0, 13.0, 13.0, 11.0, 28.0, 12.0, 22.0, 25.0, 22.0, 31.0, 37.0, 41.0, 40.0, 35.0, 35.0, 43.0, 39.0, 41.0, 31.0, 28.0, 37.0, 28.0, 46.0, 44.0, 39.0, 27.0, 23.0, 24.0, 16.0, 21.0, 23.0, 12.0, 16.0, 12.0, 12.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.123046875, -3.029815673828125, -2.93658447265625, -2.843353271484375, -2.7501220703125, -2.656890869140625, -2.56365966796875, -2.470428466796875, -2.377197265625, -2.283966064453125, -2.19073486328125, -2.097503662109375, -2.0042724609375, -1.911041259765625, -1.81781005859375, -1.724578857421875, -1.63134765625, -1.538116455078125, -1.44488525390625, -1.351654052734375, -1.2584228515625, -1.165191650390625, -1.07196044921875, -0.978729248046875, -0.885498046875, -0.792266845703125, -0.69903564453125, -0.605804443359375, -0.5125732421875, -0.419342041015625, -0.32611083984375, -0.232879638671875, -0.1396484375, -0.046417236328125, 0.04681396484375, 0.140045166015625, 0.2332763671875, 0.326507568359375, 0.41973876953125, 0.512969970703125, 0.606201171875, 0.699432373046875, 0.79266357421875, 0.885894775390625, 0.9791259765625, 1.072357177734375, 1.16558837890625, 1.258819580078125, 1.35205078125, 1.445281982421875, 1.53851318359375, 1.631744384765625, 1.7249755859375, 1.818206787109375, 1.91143798828125, 2.004669189453125, 2.097900390625, 2.191131591796875, 2.28436279296875, 2.377593994140625, 2.4708251953125, 2.564056396484375, 2.65728759765625, 2.750518798828125, 2.84375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 7.0, 4.0, 7.0, 18.0, 23.0, 21.0, 29.0, 21.0, 36.0, 51.0, 58.0, 106.0, 170.0, 255.0, 532.0, 1443.0, 8758.0, 139346.0, 1511165.0, 2182001.0, 326525.0, 19234.0, 2549.0, 783.0, 380.0, 214.0, 149.0, 88.0, 65.0, 52.0, 40.0, 23.0, 12.0, 15.0, 12.0, 14.0, 13.0, 8.0, 11.0, 3.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-7.28515625, -7.07183837890625, -6.8585205078125, -6.64520263671875, -6.431884765625, -6.21856689453125, -6.0052490234375, -5.79193115234375, -5.57861328125, -5.36529541015625, -5.1519775390625, -4.93865966796875, -4.725341796875, -4.51202392578125, -4.2987060546875, -4.08538818359375, -3.8720703125, -3.65875244140625, -3.4454345703125, -3.23211669921875, -3.018798828125, -2.80548095703125, -2.5921630859375, -2.37884521484375, -2.16552734375, -1.95220947265625, -1.7388916015625, -1.52557373046875, -1.312255859375, -1.09893798828125, -0.8856201171875, -0.67230224609375, -0.458984375, -0.24566650390625, -0.0323486328125, 0.18096923828125, 0.394287109375, 0.60760498046875, 0.8209228515625, 1.03424072265625, 1.24755859375, 1.46087646484375, 1.6741943359375, 1.88751220703125, 2.100830078125, 2.31414794921875, 2.5274658203125, 2.74078369140625, 2.9541015625, 3.16741943359375, 3.3807373046875, 3.59405517578125, 3.807373046875, 4.02069091796875, 4.2340087890625, 4.44732666015625, 4.66064453125, 4.87396240234375, 5.0872802734375, 5.30059814453125, 5.513916015625, 5.72723388671875, 5.9405517578125, 6.15386962890625, 6.3671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 9.0, 8.0, 24.0, 30.0, 39.0, 36.0, 57.0, 85.0, 115.0, 142.0, 226.0, 269.0, 348.0, 421.0, 443.0, 383.0, 369.0, 262.0, 207.0, 177.0, 114.0, 86.0, 57.0, 43.0, 39.0, 18.0, 16.0, 14.0, 8.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.17108154296875, -5.9749755859375, -5.77886962890625, -5.582763671875, -5.38665771484375, -5.1905517578125, -4.99444580078125, -4.79833984375, -4.60223388671875, -4.4061279296875, -4.21002197265625, -4.013916015625, -3.81781005859375, -3.6217041015625, -3.42559814453125, -3.2294921875, -3.03338623046875, -2.8372802734375, -2.64117431640625, -2.445068359375, -2.24896240234375, -2.0528564453125, -1.85675048828125, -1.66064453125, -1.46453857421875, -1.2684326171875, -1.07232666015625, -0.876220703125, -0.68011474609375, -0.4840087890625, -0.28790283203125, -0.091796875, 0.10430908203125, 0.3004150390625, 0.49652099609375, 0.692626953125, 0.88873291015625, 1.0848388671875, 1.28094482421875, 1.47705078125, 1.67315673828125, 1.8692626953125, 2.06536865234375, 2.261474609375, 2.45758056640625, 2.6536865234375, 2.84979248046875, 3.0458984375, 3.24200439453125, 3.4381103515625, 3.63421630859375, 3.830322265625, 4.02642822265625, 4.2225341796875, 4.41864013671875, 4.61474609375, 4.81085205078125, 5.0069580078125, 5.20306396484375, 5.399169921875, 5.59527587890625, 5.7913818359375, 5.98748779296875, 6.18359375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 11.0, 12.0, 16.0, 21.0, 20.0, 44.0, 69.0, 74.0, 124.0, 127.0, 238.0, 297.0, 413.0, 866.0, 21210.0, 3509198.0, 656434.0, 3275.0, 536.0, 372.0, 268.0, 164.0, 140.0, 95.0, 54.0, 58.0, 47.0, 29.0, 25.0, 10.0, 10.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.015625, -21.34423828125, -20.6728515625, -20.00146484375, -19.330078125, -18.65869140625, -17.9873046875, -17.31591796875, -16.64453125, -15.97314453125, -15.3017578125, -14.63037109375, -13.958984375, -13.28759765625, -12.6162109375, -11.94482421875, -11.2734375, -10.60205078125, -9.9306640625, -9.25927734375, -8.587890625, -7.91650390625, -7.2451171875, -6.57373046875, -5.90234375, -5.23095703125, -4.5595703125, -3.88818359375, -3.216796875, -2.54541015625, -1.8740234375, -1.20263671875, -0.53125, 0.14013671875, 0.8115234375, 1.48291015625, 2.154296875, 2.82568359375, 3.4970703125, 4.16845703125, 4.83984375, 5.51123046875, 6.1826171875, 6.85400390625, 7.525390625, 8.19677734375, 8.8681640625, 9.53955078125, 10.2109375, 10.88232421875, 11.5537109375, 12.22509765625, 12.896484375, 13.56787109375, 14.2392578125, 14.91064453125, 15.58203125, 16.25341796875, 16.9248046875, 17.59619140625, 18.267578125, 18.93896484375, 19.6103515625, 20.28173828125, 20.953125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 20.0, 31.0, 55.0, 58.0, 81.0, 90.0, 117.0, 104.0, 96.0, 96.0, 68.0, 52.0, 44.0, 32.0, 21.0, 15.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.229339599609375, -29.47683334350586, -28.724327087402344, -27.971820831298828, -27.219314575195312, -26.466808319091797, -25.71430206298828, -24.961795806884766, -24.20928955078125, -23.456783294677734, -22.70427703857422, -21.951770782470703, -21.199264526367188, -20.446758270263672, -19.694252014160156, -18.94174575805664, -18.189241409301758, -17.436735153198242, -16.684228897094727, -15.931722640991211, -15.179216384887695, -14.42671012878418, -13.67420482635498, -12.921698570251465, -12.16919231414795, -11.416686058044434, -10.664179801940918, -9.911674499511719, -9.159168243408203, -8.406661987304688, -7.654155731201172, -6.901649475097656, -6.149145126342773, -5.396638870239258, -4.644132614135742, -3.8916268348693848, -3.139120578765869, -2.3866143226623535, -1.634108543395996, -0.8816022872924805, -0.12909603118896484, 0.6234101057052612, 1.3759162425994873, 2.128422260284424, 2.8809285163879395, 3.633434772491455, 4.3859405517578125, 5.138446807861328, 5.890953063964844, 6.643459320068359, 7.395965576171875, 8.14847183227539, 8.900978088378906, 9.653484344482422, 10.405989646911621, 11.158495903015137, 11.911002159118652, 12.663508415222168, 13.416014671325684, 14.168519973754883, 14.921026229858398, 15.673532485961914, 16.42603874206543, 17.178544998168945, 17.93105125427246]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 1.0, 6.0, 9.0, 8.0, 9.0, 14.0, 8.0, 32.0, 15.0, 21.0, 32.0, 17.0, 44.0, 29.0, 34.0, 43.0, 42.0, 49.0, 47.0, 39.0, 46.0, 50.0, 47.0, 55.0, 44.0, 36.0, 45.0, 30.0, 32.0, 19.0, 22.0, 18.0, 11.0, 12.0, 12.0, 11.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.076969146728516, -20.358362197875977, -19.639753341674805, -18.921146392822266, -18.202539443969727, -17.483930587768555, -16.765323638916016, -16.046714782714844, -15.328107833862305, -14.60949993133545, -13.89089298248291, -13.172285079956055, -12.4536771774292, -11.735069274902344, -11.016462326049805, -10.29785442352295, -9.57924747467041, -8.860639572143555, -8.142032623291016, -7.42342472076416, -6.704816818237305, -5.986209392547607, -5.26760196685791, -4.548994064331055, -3.8303866386413574, -3.111778974533081, -2.3931713104248047, -1.6745638847351074, -0.955956220626831, -0.2373485565185547, 0.4812588691711426, 1.199866771697998, 1.9184741973876953, 2.6370818614959717, 3.355689525604248, 4.074296951293945, 4.792904853820801, 5.511512279510498, 6.230119705200195, 6.948727607727051, 7.667335033416748, 8.385942459106445, 9.1045503616333, 9.823158264160156, 10.541765213012695, 11.26037311553955, 11.978981018066406, 12.697587966918945, 13.4161958694458, 14.134803771972656, 14.853410720825195, 15.57201862335205, 16.290626525878906, 17.009233474731445, 17.727840423583984, 18.446449279785156, 19.165056228637695, 19.883663177490234, 20.602272033691406, 21.320878982543945, 22.039485931396484, 22.758094787597656, 23.476701736450195, 24.195308685302734, 24.913917541503906]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 15.0, 27.0, 16.0, 16.0, 19.0, 34.0, 36.0, 24.0, 28.0, 44.0, 37.0, 45.0, 34.0, 37.0, 33.0, 43.0, 38.0, 39.0, 37.0, 38.0, 36.0, 29.0, 36.0, 29.0, 20.0, 16.0, 19.0, 18.0, 24.0, 17.0, 11.0, 7.0, 7.0, 14.0, 6.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76177978515625, -2.6719970703125, -2.58221435546875, -2.492431640625, -2.40264892578125, -2.3128662109375, -2.22308349609375, -2.13330078125, -2.04351806640625, -1.9537353515625, -1.86395263671875, -1.774169921875, -1.68438720703125, -1.5946044921875, -1.50482177734375, -1.4150390625, -1.32525634765625, -1.2354736328125, -1.14569091796875, -1.055908203125, -0.96612548828125, -0.8763427734375, -0.78656005859375, -0.69677734375, -0.60699462890625, -0.5172119140625, -0.42742919921875, -0.337646484375, -0.24786376953125, -0.1580810546875, -0.06829833984375, 0.021484375, 0.11126708984375, 0.2010498046875, 0.29083251953125, 0.380615234375, 0.47039794921875, 0.5601806640625, 0.64996337890625, 0.73974609375, 0.82952880859375, 0.9193115234375, 1.00909423828125, 1.098876953125, 1.18865966796875, 1.2784423828125, 1.36822509765625, 1.4580078125, 1.54779052734375, 1.6375732421875, 1.72735595703125, 1.817138671875, 1.90692138671875, 1.9967041015625, 2.08648681640625, 2.17626953125, 2.26605224609375, 2.3558349609375, 2.44561767578125, 2.535400390625, 2.62518310546875, 2.7149658203125, 2.80474853515625, 2.89453125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 7.0, 14.0, 16.0, 30.0, 44.0, 53.0, 98.0, 99.0, 148.0, 247.0, 402.0, 548.0, 801.0, 1231.0, 1728.0, 2577.0, 3838.0, 5766.0, 8419.0, 12789.0, 18863.0, 29283.0, 45331.0, 74132.0, 137112.0, 275459.0, 180946.0, 92373.0, 54390.0, 34463.0, 22068.0, 14924.0, 9909.0, 6700.0, 4504.0, 2926.0, 2073.0, 1419.0, 908.0, 581.0, 429.0, 307.0, 188.0, 119.0, 93.0, 72.0, 46.0, 29.0, 16.0, 18.0, 4.0, 10.0, 4.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.5205078125, -0.5045852661132812, -0.4886627197265625, -0.47274017333984375, -0.456817626953125, -0.44089508056640625, -0.4249725341796875, -0.40904998779296875, -0.39312744140625, -0.37720489501953125, -0.3612823486328125, -0.34535980224609375, -0.329437255859375, -0.31351470947265625, -0.2975921630859375, -0.28166961669921875, -0.2657470703125, -0.24982452392578125, -0.2339019775390625, -0.21797943115234375, -0.202056884765625, -0.18613433837890625, -0.1702117919921875, -0.15428924560546875, -0.13836669921875, -0.12244415283203125, -0.1065216064453125, -0.09059906005859375, -0.074676513671875, -0.05875396728515625, -0.0428314208984375, -0.02690887451171875, -0.010986328125, 0.00493621826171875, 0.0208587646484375, 0.03678131103515625, 0.052703857421875, 0.06862640380859375, 0.0845489501953125, 0.10047149658203125, 0.11639404296875, 0.13231658935546875, 0.1482391357421875, 0.16416168212890625, 0.180084228515625, 0.19600677490234375, 0.2119293212890625, 0.22785186767578125, 0.2437744140625, 0.25969696044921875, 0.2756195068359375, 0.29154205322265625, 0.307464599609375, 0.32338714599609375, 0.3393096923828125, 0.35523223876953125, 0.37115478515625, 0.38707733154296875, 0.4029998779296875, 0.41892242431640625, 0.434844970703125, 0.45076751708984375, 0.4666900634765625, 0.48261260986328125, 0.49853515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 7.0, 10.0, 11.0, 7.0, 8.0, 13.0, 14.0, 17.0, 13.0, 14.0, 29.0, 27.0, 24.0, 29.0, 32.0, 41.0, 33.0, 47.0, 37.0, 37.0, 1062.0, 38.0, 37.0, 26.0, 37.0, 33.0, 26.0, 22.0, 27.0, 26.0, 33.0, 29.0, 31.0, 23.0, 16.0, 14.0, 12.0, 12.0, 14.0, 12.0, 5.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-1.935546875, -1.88006591796875, -1.8245849609375, -1.76910400390625, -1.713623046875, -1.65814208984375, -1.6026611328125, -1.54718017578125, -1.49169921875, -1.43621826171875, -1.3807373046875, -1.32525634765625, -1.269775390625, -1.21429443359375, -1.1588134765625, -1.10333251953125, -1.0478515625, -0.99237060546875, -0.9368896484375, -0.88140869140625, -0.825927734375, -0.77044677734375, -0.7149658203125, -0.65948486328125, -0.60400390625, -0.54852294921875, -0.4930419921875, -0.43756103515625, -0.382080078125, -0.32659912109375, -0.2711181640625, -0.21563720703125, -0.16015625, -0.10467529296875, -0.0491943359375, 0.00628662109375, 0.061767578125, 0.11724853515625, 0.1727294921875, 0.22821044921875, 0.28369140625, 0.33917236328125, 0.3946533203125, 0.45013427734375, 0.505615234375, 0.56109619140625, 0.6165771484375, 0.67205810546875, 0.7275390625, 0.78302001953125, 0.8385009765625, 0.89398193359375, 0.949462890625, 1.00494384765625, 1.0604248046875, 1.11590576171875, 1.17138671875, 1.22686767578125, 1.2823486328125, 1.33782958984375, 1.393310546875, 1.44879150390625, 1.5042724609375, 1.55975341796875, 1.615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 24.0, 24.0, 44.0, 40.0, 85.0, 143.0, 154.0, 252.0, 356.0, 612.0, 849.0, 1191.0, 1718.0, 2544.0, 3881.0, 5571.0, 8686.0, 13032.0, 20271.0, 31704.0, 51076.0, 87654.0, 173704.0, 1342331.0, 146130.0, 77403.0, 45662.0, 27971.0, 18045.0, 11778.0, 7834.0, 5150.0, 3529.0, 2454.0, 1694.0, 1125.0, 784.0, 521.0, 382.0, 211.0, 183.0, 117.0, 75.0, 44.0, 25.0, 21.0, 15.0, 7.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5243377685546875, -0.508148193359375, -0.4919586181640625, -0.47576904296875, -0.4595794677734375, -0.443389892578125, -0.4272003173828125, -0.4110107421875, -0.3948211669921875, -0.378631591796875, -0.3624420166015625, -0.34625244140625, -0.3300628662109375, -0.313873291015625, -0.2976837158203125, -0.281494140625, -0.2653045654296875, -0.249114990234375, -0.2329254150390625, -0.21673583984375, -0.2005462646484375, -0.184356689453125, -0.1681671142578125, -0.1519775390625, -0.1357879638671875, -0.119598388671875, -0.1034088134765625, -0.08721923828125, -0.0710296630859375, -0.054840087890625, -0.0386505126953125, -0.0224609375, -0.0062713623046875, 0.009918212890625, 0.0261077880859375, 0.04229736328125, 0.0584869384765625, 0.074676513671875, 0.0908660888671875, 0.1070556640625, 0.1232452392578125, 0.139434814453125, 0.1556243896484375, 0.17181396484375, 0.1880035400390625, 0.204193115234375, 0.2203826904296875, 0.236572265625, 0.2527618408203125, 0.268951416015625, 0.2851409912109375, 0.30133056640625, 0.3175201416015625, 0.333709716796875, 0.3498992919921875, 0.3660888671875, 0.3822784423828125, 0.398468017578125, 0.4146575927734375, 0.43084716796875, 0.4470367431640625, 0.463226318359375, 0.4794158935546875, 0.49560546875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 3.0, 10.0, 12.0, 10.0, 20.0, 14.0, 23.0, 22.0, 33.0, 26.0, 30.0, 58.0, 60.0, 67.0, 66.0, 75.0, 69.0, 65.0, 51.0, 41.0, 49.0, 30.0, 23.0, 21.0, 19.0, 18.0, 13.0, 7.0, 12.0, 6.0, 4.0, 4.0, 4.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037384033203125, -0.00036083534359931946, -0.0003478303551673889, -0.0003348253667354584, -0.00032182037830352783, -0.0003088153898715973, -0.00029581040143966675, -0.0002828054130077362, -0.00026980042457580566, -0.0002567954361438751, -0.00024379044771194458, -0.00023078545928001404, -0.0002177804708480835, -0.00020477548241615295, -0.0001917704939842224, -0.00017876550555229187, -0.00016576051712036133, -0.00015275552868843079, -0.00013975054025650024, -0.0001267455518245697, -0.00011374056339263916, -0.00010073557496070862, -8.773058652877808e-05, -7.472559809684753e-05, -6.172060966491699e-05, -4.871562123298645e-05, -3.571063280105591e-05, -2.2705644369125366e-05, -9.700655937194824e-06, 3.3043324947357178e-06, 1.630932092666626e-05, 2.9314309358596802e-05, 4.2319297790527344e-05, 5.5324286222457886e-05, 6.832927465438843e-05, 8.133426308631897e-05, 9.433925151824951e-05, 0.00010734423995018005, 0.0001203492283821106, 0.00013335421681404114, 0.00014635920524597168, 0.00015936419367790222, 0.00017236918210983276, 0.0001853741705417633, 0.00019837915897369385, 0.0002113841474056244, 0.00022438913583755493, 0.00023739412426948547, 0.000250399112701416, 0.00026340410113334656, 0.0002764090895652771, 0.00028941407799720764, 0.0003024190664291382, 0.0003154240548610687, 0.00032842904329299927, 0.0003414340317249298, 0.00035443902015686035, 0.0003674440085887909, 0.00038044899702072144, 0.000393453985452652, 0.0004064589738845825, 0.00041946396231651306, 0.0004324689507484436, 0.00044547393918037415, 0.0004584789276123047]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 8.0, 8.0, 9.0, 13.0, 18.0, 15.0, 21.0, 26.0, 29.0, 37.0, 62.0, 83.0, 135.0, 216.0, 405.0, 950.0, 131347.0, 912327.0, 1452.0, 549.0, 251.0, 159.0, 80.0, 73.0, 56.0, 55.0, 27.0, 24.0, 23.0, 16.0, 16.0, 12.0, 10.0, 4.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00946807861328125, -0.009198606014251709, -0.008929133415222168, -0.008659660816192627, -0.008390188217163086, -0.008120715618133545, -0.007851243019104004, -0.007581770420074463, -0.007312297821044922, -0.007042825222015381, -0.00677335262298584, -0.006503880023956299, -0.006234407424926758, -0.005964934825897217, -0.005695462226867676, -0.005425989627838135, -0.005156517028808594, -0.004887044429779053, -0.004617571830749512, -0.004348099231719971, -0.00407862663269043, -0.0038091540336608887, -0.0035396814346313477, -0.0032702088356018066, -0.0030007362365722656, -0.0027312636375427246, -0.0024617910385131836, -0.0021923184394836426, -0.0019228458404541016, -0.0016533732414245605, -0.0013839006423950195, -0.0011144280433654785, -0.0008449554443359375, -0.0005754828453063965, -0.00030601024627685547, -3.653764724731445e-05, 0.00023293495178222656, 0.0005024075508117676, 0.0007718801498413086, 0.0010413527488708496, 0.0013108253479003906, 0.0015802979469299316, 0.0018497705459594727, 0.0021192431449890137, 0.0023887157440185547, 0.0026581883430480957, 0.0029276609420776367, 0.0031971335411071777, 0.0034666061401367188, 0.0037360787391662598, 0.004005551338195801, 0.004275023937225342, 0.004544496536254883, 0.004813969135284424, 0.005083441734313965, 0.005352914333343506, 0.005622386932373047, 0.005891859531402588, 0.006161332130432129, 0.00643080472946167, 0.006700277328491211, 0.006969749927520752, 0.007239222526550293, 0.007508695125579834, 0.007778167724609375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 54.0, 660.0, 297.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010406688088551164, -0.0009949058294296265, -0.0009491429664194584, -0.0009033800452016294, -0.0008576171239838004, -0.0008118542027659714, -0.0007660912815481424, -0.0007203283603303134, -0.0006745654391124845, -0.0006288025178946555, -0.0005830395966768265, -0.0005372766754589975, -0.0004915137542411685, -0.0004457508330233395, -0.0003999879118055105, -0.00035422499058768153, -0.00030846206936985254, -0.00026269914815202355, -0.00021693622693419456, -0.00017117330571636558, -0.0001254103844985366, -7.96474632807076e-05, -3.388454206287861e-05, 1.187837915495038e-05, 5.764130037277937e-05, 0.00010340422159060836, 0.00014916714280843735, 0.00019493006402626634, 0.00024069298524409533, 0.0002864559064619243, 0.0003322188276797533, 0.0003779817488975823, 0.0004237447865307331, 0.0004695077077485621, 0.0005152706289663911, 0.0005610335501842201, 0.0006067964714020491, 0.000652559392619878, 0.000698322313837707, 0.000744085235055536, 0.000789848156273365, 0.000835611077491194, 0.000881373998709023, 0.000927136919926852, 0.000972899841144681, 0.001018662704154849, 0.001064425683580339, 0.0011101886630058289, 0.001155951526015997, 0.001201714389026165, 0.001247477368451655, 0.0012932403478771448, 0.0013390032108873129, 0.001384766073897481, 0.0014305290533229709, 0.0014762920327484608, 0.0015220548957586288, 0.001567817758768797, 0.0016135807381942868, 0.0016593437176197767, 0.0017051065806299448, 0.0017508694436401129, 0.0017966324230656028, 0.0018423954024910927, 0.0018881582655012608]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 9.0, 4.0, 5.0, 12.0, 14.0, 15.0, 21.0, 17.0, 20.0, 22.0, 24.0, 20.0, 36.0, 39.0, 36.0, 27.0, 29.0, 31.0, 31.0, 36.0, 33.0, 45.0, 41.0, 41.0, 30.0, 26.0, 32.0, 33.0, 32.0, 28.0, 19.0, 23.0, 24.0, 14.0, 21.0, 15.0, 12.0, 15.0, 15.0, 4.0, 10.0, 5.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 5.0, 3.0], "bins": [-0.0001995563507080078, -0.00019373930990695953, -0.00018792226910591125, -0.00018210522830486298, -0.0001762881875038147, -0.00017047114670276642, -0.00016465410590171814, -0.00015883706510066986, -0.00015302002429962158, -0.0001472029834985733, -0.00014138594269752502, -0.00013556890189647675, -0.00012975186109542847, -0.0001239348202943802, -0.00011811777949333191, -0.00011230073869228363, -0.00010648369789123535, -0.00010066665709018707, -9.48496162891388e-05, -8.903257548809052e-05, -8.321553468704224e-05, -7.739849388599396e-05, -7.158145308494568e-05, -6.57644122838974e-05, -5.994737148284912e-05, -5.413033068180084e-05, -4.8313289880752563e-05, -4.2496249079704285e-05, -3.6679208278656006e-05, -3.086216747760773e-05, -2.5045126676559448e-05, -1.922808587551117e-05, -1.341104507446289e-05, -7.594004273414612e-06, -1.776963472366333e-06, 4.040077328681946e-06, 9.857118129730225e-06, 1.5674158930778503e-05, 2.1491199731826782e-05, 2.730824053287506e-05, 3.312528133392334e-05, 3.894232213497162e-05, 4.47593629360199e-05, 5.0576403737068176e-05, 5.6393444538116455e-05, 6.221048533916473e-05, 6.802752614021301e-05, 7.384456694126129e-05, 7.966160774230957e-05, 8.547864854335785e-05, 9.129568934440613e-05, 9.71127301454544e-05, 0.00010292977094650269, 0.00010874681174755096, 0.00011456385254859924, 0.00012038089334964752, 0.0001261979341506958, 0.00013201497495174408, 0.00013783201575279236, 0.00014364905655384064, 0.00014946609735488892, 0.0001552831381559372, 0.00016110017895698547, 0.00016691721975803375, 0.00017273426055908203]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 15.0, 27.0, 16.0, 16.0, 19.0, 34.0, 36.0, 24.0, 28.0, 44.0, 38.0, 44.0, 34.0, 37.0, 33.0, 42.0, 39.0, 39.0, 37.0, 38.0, 36.0, 29.0, 36.0, 29.0, 20.0, 16.0, 19.0, 18.0, 24.0, 17.0, 11.0, 7.0, 7.0, 14.0, 6.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76177978515625, -2.6719970703125, -2.58221435546875, -2.492431640625, -2.40264892578125, -2.3128662109375, -2.22308349609375, -2.13330078125, -2.04351806640625, -1.9537353515625, -1.86395263671875, -1.774169921875, -1.68438720703125, -1.5946044921875, -1.50482177734375, -1.4150390625, -1.32525634765625, -1.2354736328125, -1.14569091796875, -1.055908203125, -0.96612548828125, -0.8763427734375, -0.78656005859375, -0.69677734375, -0.60699462890625, -0.5172119140625, -0.42742919921875, -0.337646484375, -0.24786376953125, -0.1580810546875, -0.06829833984375, 0.021484375, 0.11126708984375, 0.2010498046875, 0.29083251953125, 0.380615234375, 0.47039794921875, 0.5601806640625, 0.64996337890625, 0.73974609375, 0.82952880859375, 0.9193115234375, 1.00909423828125, 1.098876953125, 1.18865966796875, 1.2784423828125, 1.36822509765625, 1.4580078125, 1.54779052734375, 1.6375732421875, 1.72735595703125, 1.817138671875, 1.90692138671875, 1.9967041015625, 2.08648681640625, 2.17626953125, 2.26605224609375, 2.3558349609375, 2.44561767578125, 2.535400390625, 2.62518310546875, 2.7149658203125, 2.80474853515625, 2.89453125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 1.0, 9.0, 14.0, 13.0, 24.0, 24.0, 47.0, 51.0, 67.0, 103.0, 102.0, 177.0, 245.0, 401.0, 705.0, 1328.0, 2677.0, 5535.0, 13060.0, 30777.0, 74208.0, 171382.0, 373984.0, 212173.0, 92397.0, 38601.0, 16359.0, 7071.0, 3228.0, 1583.0, 815.0, 423.0, 269.0, 170.0, 119.0, 115.0, 82.0, 58.0, 37.0, 31.0, 21.0, 22.0, 11.0, 7.0, 9.0, 6.0, 8.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.751953125, -2.664947509765625, -2.57794189453125, -2.490936279296875, -2.4039306640625, -2.316925048828125, -2.22991943359375, -2.142913818359375, -2.055908203125, -1.968902587890625, -1.88189697265625, -1.794891357421875, -1.7078857421875, -1.620880126953125, -1.53387451171875, -1.446868896484375, -1.35986328125, -1.272857666015625, -1.18585205078125, -1.098846435546875, -1.0118408203125, -0.924835205078125, -0.83782958984375, -0.750823974609375, -0.663818359375, -0.576812744140625, -0.48980712890625, -0.402801513671875, -0.3157958984375, -0.228790283203125, -0.14178466796875, -0.054779052734375, 0.0322265625, 0.119232177734375, 0.20623779296875, 0.293243408203125, 0.3802490234375, 0.467254638671875, 0.55426025390625, 0.641265869140625, 0.728271484375, 0.815277099609375, 0.90228271484375, 0.989288330078125, 1.0762939453125, 1.163299560546875, 1.25030517578125, 1.337310791015625, 1.42431640625, 1.511322021484375, 1.59832763671875, 1.685333251953125, 1.7723388671875, 1.859344482421875, 1.94635009765625, 2.033355712890625, 2.120361328125, 2.207366943359375, 2.29437255859375, 2.381378173828125, 2.4683837890625, 2.555389404296875, 2.64239501953125, 2.729400634765625, 2.81640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 3.0, 10.0, 7.0, 8.0, 13.0, 12.0, 16.0, 15.0, 21.0, 29.0, 18.0, 32.0, 35.0, 38.0, 44.0, 43.0, 56.0, 99.0, 234.0, 1512.0, 283.0, 76.0, 60.0, 53.0, 40.0, 27.0, 25.0, 37.0, 27.0, 22.0, 25.0, 23.0, 14.0, 11.0, 9.0, 15.0, 7.0, 10.0, 3.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.3671875, -10.028076171875, -9.68896484375, -9.349853515625, -9.0107421875, -8.671630859375, -8.33251953125, -7.993408203125, -7.654296875, -7.315185546875, -6.97607421875, -6.636962890625, -6.2978515625, -5.958740234375, -5.61962890625, -5.280517578125, -4.94140625, -4.602294921875, -4.26318359375, -3.924072265625, -3.5849609375, -3.245849609375, -2.90673828125, -2.567626953125, -2.228515625, -1.889404296875, -1.55029296875, -1.211181640625, -0.8720703125, -0.532958984375, -0.19384765625, 0.145263671875, 0.484375, 0.823486328125, 1.16259765625, 1.501708984375, 1.8408203125, 2.179931640625, 2.51904296875, 2.858154296875, 3.197265625, 3.536376953125, 3.87548828125, 4.214599609375, 4.5537109375, 4.892822265625, 5.23193359375, 5.571044921875, 5.91015625, 6.249267578125, 6.58837890625, 6.927490234375, 7.2666015625, 7.605712890625, 7.94482421875, 8.283935546875, 8.623046875, 8.962158203125, 9.30126953125, 9.640380859375, 9.9794921875, 10.318603515625, 10.65771484375, 10.996826171875, 11.3359375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 15.0, 12.0, 16.0, 25.0, 33.0, 49.0, 74.0, 124.0, 179.0, 381.0, 1402.0, 1727101.0, 1413984.0, 1332.0, 403.0, 204.0, 104.0, 80.0, 48.0, 41.0, 33.0, 19.0, 11.0, 8.0, 8.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.5, -69.5673828125, -67.634765625, -65.7021484375, -63.76953125, -61.8369140625, -59.904296875, -57.9716796875, -56.0390625, -54.1064453125, -52.173828125, -50.2412109375, -48.30859375, -46.3759765625, -44.443359375, -42.5107421875, -40.578125, -38.6455078125, -36.712890625, -34.7802734375, -32.84765625, -30.9150390625, -28.982421875, -27.0498046875, -25.1171875, -23.1845703125, -21.251953125, -19.3193359375, -17.38671875, -15.4541015625, -13.521484375, -11.5888671875, -9.65625, -7.7236328125, -5.791015625, -3.8583984375, -1.92578125, 0.0068359375, 1.939453125, 3.8720703125, 5.8046875, 7.7373046875, 9.669921875, 11.6025390625, 13.53515625, 15.4677734375, 17.400390625, 19.3330078125, 21.265625, 23.1982421875, 25.130859375, 27.0634765625, 28.99609375, 30.9287109375, 32.861328125, 34.7939453125, 36.7265625, 38.6591796875, 40.591796875, 42.5244140625, 44.45703125, 46.3896484375, 48.322265625, 50.2548828125, 52.1875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 38.0, 165.0, 292.0, 318.0, 149.0, 37.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66176700592041, -5.574765682220459, -4.487764358520508, -3.4007625579833984, -2.3137612342834473, -1.226759910583496, -0.13975811004638672, 0.9472432136535645, 2.0342445373535156, 3.121245861053467, 4.208247184753418, 5.295248985290527, 6.3822503089904785, 7.46925163269043, 8.556253433227539, 9.643255233764648, 10.730256080627441, 11.81725788116455, 12.904258728027344, 13.991260528564453, 15.078262329101562, 16.165264129638672, 17.25226593017578, 18.339265823364258, 19.426267623901367, 20.513269424438477, 21.600271224975586, 22.687271118164062, 23.774272918701172, 24.86127471923828, 25.94827651977539, 27.0352783203125, 28.12228012084961, 29.20928192138672, 30.296283721923828, 31.383285522460938, 32.47028732299805, 33.557289123535156, 34.644287109375, 35.73128890991211, 36.81829071044922, 37.90529251098633, 38.99229431152344, 40.07929611206055, 41.166297912597656, 42.2532958984375, 43.340301513671875, 44.42729949951172, 45.514305114746094, 46.6013069152832, 47.68830871582031, 48.77531051635742, 49.86231231689453, 50.949310302734375, 52.03631591796875, 53.123313903808594, 54.2103157043457, 55.29731750488281, 56.38431930541992, 57.47132110595703, 58.55832290649414, 59.64532470703125, 60.732322692871094, 61.8193244934082, 62.90632629394531]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 3.0, 4.0, 5.0, 7.0, 8.0, 6.0, 7.0, 12.0, 15.0, 10.0, 28.0, 22.0, 20.0, 20.0, 26.0, 31.0, 33.0, 37.0, 34.0, 36.0, 41.0, 41.0, 47.0, 34.0, 43.0, 43.0, 39.0, 30.0, 24.0, 42.0, 38.0, 33.0, 31.0, 27.0, 23.0, 16.0, 15.0, 16.0, 14.0, 13.0, 10.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.7840576171875, -20.971065521240234, -20.1580753326416, -19.345083236694336, -18.532093048095703, -17.719100952148438, -16.906108856201172, -16.093116760253906, -15.280126571655273, -14.467135429382324, -13.654144287109375, -12.84115219116211, -12.02816104888916, -11.215169906616211, -10.402177810668945, -9.589186668395996, -8.776195526123047, -7.963204383850098, -7.15021276473999, -6.337221145629883, -5.524230003356934, -4.711238861083984, -3.898247241973877, -3.0852556228637695, -2.2722644805908203, -1.459273099899292, -0.6462817192077637, 0.16670966148376465, 0.979701042175293, 1.7926921844482422, 2.6056838035583496, 3.418675422668457, 4.231666564941406, 5.0446577072143555, 5.857649326324463, 6.67064094543457, 7.4836320877075195, 8.296623229980469, 9.109615325927734, 9.922606468200684, 10.735597610473633, 11.548588752746582, 12.361579895019531, 13.174571990966797, 13.987563133239746, 14.800554275512695, 15.613546371459961, 16.426536560058594, 17.23952865600586, 18.052520751953125, 18.865510940551758, 19.678503036499023, 20.491493225097656, 21.304485321044922, 22.117477416992188, 22.930469512939453, 23.743459701538086, 24.55645179748535, 25.369441986083984, 26.18243408203125, 26.995426177978516, 27.80841636657715, 28.621408462524414, 29.434398651123047, 30.247390747070312]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 11.0, 8.0, 11.0, 19.0, 7.0, 19.0, 22.0, 26.0, 16.0, 27.0, 28.0, 31.0, 27.0, 40.0, 32.0, 37.0, 32.0, 36.0, 39.0, 37.0, 42.0, 40.0, 36.0, 40.0, 35.0, 38.0, 38.0, 32.0, 23.0, 24.0, 22.0, 12.0, 14.0, 19.0, 13.0, 12.0, 8.0, 15.0, 11.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.116058349609375, -3.01727294921875, -2.918487548828125, -2.8197021484375, -2.720916748046875, -2.62213134765625, -2.523345947265625, -2.424560546875, -2.325775146484375, -2.22698974609375, -2.128204345703125, -2.0294189453125, -1.930633544921875, -1.83184814453125, -1.733062744140625, -1.63427734375, -1.535491943359375, -1.43670654296875, -1.337921142578125, -1.2391357421875, -1.140350341796875, -1.04156494140625, -0.942779541015625, -0.843994140625, -0.745208740234375, -0.64642333984375, -0.547637939453125, -0.4488525390625, -0.350067138671875, -0.25128173828125, -0.152496337890625, -0.0537109375, 0.045074462890625, 0.14385986328125, 0.242645263671875, 0.3414306640625, 0.440216064453125, 0.53900146484375, 0.637786865234375, 0.736572265625, 0.835357666015625, 0.93414306640625, 1.032928466796875, 1.1317138671875, 1.230499267578125, 1.32928466796875, 1.428070068359375, 1.52685546875, 1.625640869140625, 1.72442626953125, 1.823211669921875, 1.9219970703125, 2.020782470703125, 2.11956787109375, 2.218353271484375, 2.317138671875, 2.415924072265625, 2.51470947265625, 2.613494873046875, 2.7122802734375, 2.811065673828125, 2.90985107421875, 3.008636474609375, 3.107421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 11.0, 14.0, 14.0, 24.0, 23.0, 39.0, 44.0, 44.0, 54.0, 63.0, 74.0, 94.0, 124.0, 167.0, 342.0, 699.0, 3017.0, 32336.0, 598964.0, 2567670.0, 927391.0, 56354.0, 4565.0, 926.0, 391.0, 199.0, 134.0, 100.0, 78.0, 35.0, 47.0, 38.0, 33.0, 27.0, 26.0, 26.0, 19.0, 19.0, 13.0, 8.0, 4.0, 11.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.2850341796875, -7.054443359375, -6.8238525390625, -6.59326171875, -6.3626708984375, -6.132080078125, -5.9014892578125, -5.6708984375, -5.4403076171875, -5.209716796875, -4.9791259765625, -4.74853515625, -4.5179443359375, -4.287353515625, -4.0567626953125, -3.826171875, -3.5955810546875, -3.364990234375, -3.1343994140625, -2.90380859375, -2.6732177734375, -2.442626953125, -2.2120361328125, -1.9814453125, -1.7508544921875, -1.520263671875, -1.2896728515625, -1.05908203125, -0.8284912109375, -0.597900390625, -0.3673095703125, -0.13671875, 0.0938720703125, 0.324462890625, 0.5550537109375, 0.78564453125, 1.0162353515625, 1.246826171875, 1.4774169921875, 1.7080078125, 1.9385986328125, 2.169189453125, 2.3997802734375, 2.63037109375, 2.8609619140625, 3.091552734375, 3.3221435546875, 3.552734375, 3.7833251953125, 4.013916015625, 4.2445068359375, 4.47509765625, 4.7056884765625, 4.936279296875, 5.1668701171875, 5.3974609375, 5.6280517578125, 5.858642578125, 6.0892333984375, 6.31982421875, 6.5504150390625, 6.781005859375, 7.0115966796875, 7.2421875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 8.0, 12.0, 10.0, 18.0, 24.0, 29.0, 27.0, 58.0, 70.0, 71.0, 98.0, 157.0, 151.0, 193.0, 277.0, 299.0, 364.0, 384.0, 347.0, 311.0, 258.0, 183.0, 154.0, 127.0, 92.0, 73.0, 54.0, 41.0, 40.0, 26.0, 29.0, 16.0, 13.0, 8.0, 7.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.875, -5.70941162109375, -5.5438232421875, -5.37823486328125, -5.212646484375, -5.04705810546875, -4.8814697265625, -4.71588134765625, -4.55029296875, -4.38470458984375, -4.2191162109375, -4.05352783203125, -3.887939453125, -3.72235107421875, -3.5567626953125, -3.39117431640625, -3.2255859375, -3.05999755859375, -2.8944091796875, -2.72882080078125, -2.563232421875, -2.39764404296875, -2.2320556640625, -2.06646728515625, -1.90087890625, -1.73529052734375, -1.5697021484375, -1.40411376953125, -1.238525390625, -1.07293701171875, -0.9073486328125, -0.74176025390625, -0.576171875, -0.41058349609375, -0.2449951171875, -0.07940673828125, 0.086181640625, 0.25177001953125, 0.4173583984375, 0.58294677734375, 0.74853515625, 0.91412353515625, 1.0797119140625, 1.24530029296875, 1.410888671875, 1.57647705078125, 1.7420654296875, 1.90765380859375, 2.0732421875, 2.23883056640625, 2.4044189453125, 2.57000732421875, 2.735595703125, 2.90118408203125, 3.0667724609375, 3.23236083984375, 3.39794921875, 3.56353759765625, 3.7291259765625, 3.89471435546875, 4.060302734375, 4.22589111328125, 4.3914794921875, 4.55706787109375, 4.72265625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 7.0, 6.0, 9.0, 12.0, 13.0, 17.0, 24.0, 36.0, 42.0, 38.0, 63.0, 85.0, 111.0, 162.0, 239.0, 317.0, 459.0, 1483.0, 179444.0, 3979257.0, 30054.0, 878.0, 407.0, 255.0, 218.0, 150.0, 108.0, 97.0, 76.0, 59.0, 36.0, 22.0, 23.0, 20.0, 11.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.111083984375, -21.33154296875, -20.552001953125, -19.7724609375, -18.992919921875, -18.21337890625, -17.433837890625, -16.654296875, -15.874755859375, -15.09521484375, -14.315673828125, -13.5361328125, -12.756591796875, -11.97705078125, -11.197509765625, -10.41796875, -9.638427734375, -8.85888671875, -8.079345703125, -7.2998046875, -6.520263671875, -5.74072265625, -4.961181640625, -4.181640625, -3.402099609375, -2.62255859375, -1.843017578125, -1.0634765625, -0.283935546875, 0.49560546875, 1.275146484375, 2.0546875, 2.834228515625, 3.61376953125, 4.393310546875, 5.1728515625, 5.952392578125, 6.73193359375, 7.511474609375, 8.291015625, 9.070556640625, 9.85009765625, 10.629638671875, 11.4091796875, 12.188720703125, 12.96826171875, 13.747802734375, 14.52734375, 15.306884765625, 16.08642578125, 16.865966796875, 17.6455078125, 18.425048828125, 19.20458984375, 19.984130859375, 20.763671875, 21.543212890625, 22.32275390625, 23.102294921875, 23.8818359375, 24.661376953125, 25.44091796875, 26.220458984375, 27.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 48.0, 340.0, 448.0, 160.0, 13.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03895950317383, -29.493732452392578, -25.948505401611328, -22.403278350830078, -18.858051300048828, -15.312822341918945, -11.767595291137695, -8.222368240356445, -4.677141189575195, -1.1319139003753662, 2.413313388824463, 5.958540916442871, 9.503767967224121, 13.048995971679688, 16.594223022460938, 20.139450073242188, 23.684677124023438, 27.229904174804688, 30.775131225585938, 34.32035827636719, 37.86558532714844, 41.41081237792969, 44.95603942871094, 48.50126647949219, 52.04649353027344, 55.59172058105469, 59.13694763183594, 62.68217468261719, 66.22740173339844, 69.77262878417969, 73.31785583496094, 76.86308288574219, 80.40831756591797, 83.95354461669922, 87.49877166748047, 91.04399871826172, 94.58922576904297, 98.13445281982422, 101.67967987060547, 105.22490692138672, 108.77013397216797, 112.31536102294922, 115.86058807373047, 119.40581512451172, 122.95104217529297, 126.49626922607422, 130.04150390625, 133.58673095703125, 137.1319580078125, 140.67718505859375, 144.222412109375, 147.76763916015625, 151.3128662109375, 154.85809326171875, 158.4033203125, 161.94854736328125, 165.4937744140625, 169.03900146484375, 172.584228515625, 176.12945556640625, 179.6746826171875, 183.21990966796875, 186.76513671875, 190.31036376953125, 193.8555908203125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 10.0, 14.0, 12.0, 21.0, 21.0, 18.0, 29.0, 16.0, 18.0, 37.0, 27.0, 27.0, 29.0, 45.0, 43.0, 43.0, 42.0, 38.0, 49.0, 40.0, 47.0, 39.0, 32.0, 38.0, 37.0, 23.0, 28.0, 25.0, 20.0, 18.0, 16.0, 14.0, 15.0, 12.0, 10.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.97812271118164, -20.312986373901367, -19.647851943969727, -18.982715606689453, -18.31757926940918, -17.65244483947754, -16.987308502197266, -16.322174072265625, -15.657037734985352, -14.991902351379395, -14.326766014099121, -13.661630630493164, -12.996495246887207, -12.33135986328125, -11.666223526000977, -11.00108814239502, -10.335951805114746, -9.670816421508789, -9.005680084228516, -8.340544700622559, -7.675409317016602, -7.010273456573486, -6.345137596130371, -5.680002212524414, -5.014866352081299, -4.349730491638184, -3.6845951080322266, -3.0194592475891113, -2.354323625564575, -1.689188003540039, -1.0240521430969238, -0.3589167594909668, 0.30621910095214844, 0.9713547825813293, 1.6364904642105103, 2.301626205444336, 2.966761827468872, 3.631897449493408, 4.297033309936523, 4.9621686935424805, 5.627304553985596, 6.292440414428711, 6.957575798034668, 7.622711658477783, 8.287847518920898, 8.952982902526855, 9.618118286132812, 10.283254623413086, 10.948390007019043, 11.613525390625, 12.278661727905273, 12.94379711151123, 13.608932495117188, 14.274068832397461, 14.939204216003418, 15.604339599609375, 16.26947593688965, 16.934612274169922, 17.599746704101562, 18.264883041381836, 18.93001937866211, 19.59515380859375, 20.260290145874023, 20.925426483154297, 21.590560913085938]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 11.0, 11.0, 16.0, 20.0, 26.0, 21.0, 22.0, 26.0, 22.0, 35.0, 29.0, 31.0, 33.0, 43.0, 32.0, 47.0, 44.0, 41.0, 43.0, 38.0, 41.0, 37.0, 37.0, 31.0, 26.0, 25.0, 25.0, 24.0, 14.0, 23.0, 23.0, 22.0, 7.0, 7.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.892425537109375, -2.79852294921875, -2.704620361328125, -2.6107177734375, -2.516815185546875, -2.42291259765625, -2.329010009765625, -2.235107421875, -2.141204833984375, -2.04730224609375, -1.953399658203125, -1.8594970703125, -1.765594482421875, -1.67169189453125, -1.577789306640625, -1.48388671875, -1.389984130859375, -1.29608154296875, -1.202178955078125, -1.1082763671875, -1.014373779296875, -0.92047119140625, -0.826568603515625, -0.732666015625, -0.638763427734375, -0.54486083984375, -0.450958251953125, -0.3570556640625, -0.263153076171875, -0.16925048828125, -0.075347900390625, 0.0185546875, 0.112457275390625, 0.20635986328125, 0.300262451171875, 0.3941650390625, 0.488067626953125, 0.58197021484375, 0.675872802734375, 0.769775390625, 0.863677978515625, 0.95758056640625, 1.051483154296875, 1.1453857421875, 1.239288330078125, 1.33319091796875, 1.427093505859375, 1.52099609375, 1.614898681640625, 1.70880126953125, 1.802703857421875, 1.8966064453125, 1.990509033203125, 2.08441162109375, 2.178314208984375, 2.272216796875, 2.366119384765625, 2.46002197265625, 2.553924560546875, 2.6478271484375, 2.741729736328125, 2.83563232421875, 2.929534912109375, 3.0234375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 10.0, 28.0, 31.0, 45.0, 49.0, 88.0, 128.0, 161.0, 226.0, 340.0, 486.0, 693.0, 983.0, 1409.0, 2027.0, 3035.0, 4470.0, 6369.0, 9326.0, 13735.0, 20403.0, 30290.0, 47389.0, 77297.0, 140666.0, 259590.0, 175258.0, 92252.0, 54743.0, 34735.0, 23021.0, 15595.0, 10592.0, 7172.0, 4969.0, 3331.0, 2298.0, 1608.0, 1151.0, 757.0, 549.0, 385.0, 247.0, 166.0, 141.0, 94.0, 56.0, 52.0, 31.0, 26.0, 16.0, 10.0, 8.0, 8.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.485595703125, -0.4702568054199219, -0.45491790771484375, -0.4395790100097656, -0.4242401123046875, -0.4089012145996094, -0.39356231689453125, -0.3782234191894531, -0.362884521484375, -0.3475456237792969, -0.33220672607421875, -0.3168678283691406, -0.3015289306640625, -0.2861900329589844, -0.27085113525390625, -0.2555122375488281, -0.24017333984375, -0.22483444213867188, -0.20949554443359375, -0.19415664672851562, -0.1788177490234375, -0.16347885131835938, -0.14813995361328125, -0.13280105590820312, -0.117462158203125, -0.10212326049804688, -0.08678436279296875, -0.07144546508789062, -0.0561065673828125, -0.040767669677734375, -0.02542877197265625, -0.010089874267578125, 0.0052490234375, 0.020587921142578125, 0.03592681884765625, 0.051265716552734375, 0.0666046142578125, 0.08194351196289062, 0.09728240966796875, 0.11262130737304688, 0.127960205078125, 0.14329910278320312, 0.15863800048828125, 0.17397689819335938, 0.1893157958984375, 0.20465469360351562, 0.21999359130859375, 0.23533248901367188, 0.25067138671875, 0.2660102844238281, 0.28134918212890625, 0.2966880798339844, 0.3120269775390625, 0.3273658752441406, 0.34270477294921875, 0.3580436706542969, 0.373382568359375, 0.3887214660644531, 0.40406036376953125, 0.4193992614746094, 0.4347381591796875, 0.4500770568847656, 0.46541595458984375, 0.4807548522949219, 0.49609375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 1.0, 7.0, 4.0, 4.0, 9.0, 7.0, 12.0, 20.0, 11.0, 19.0, 18.0, 12.0, 20.0, 23.0, 15.0, 26.0, 41.0, 37.0, 36.0, 37.0, 42.0, 33.0, 40.0, 1064.0, 38.0, 51.0, 33.0, 39.0, 38.0, 34.0, 30.0, 28.0, 37.0, 24.0, 33.0, 20.0, 20.0, 9.0, 7.0, 10.0, 9.0, 2.0, 8.0, 12.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6103515625, -1.5503692626953125, -1.490386962890625, -1.4304046630859375, -1.37042236328125, -1.3104400634765625, -1.250457763671875, -1.1904754638671875, -1.1304931640625, -1.0705108642578125, -1.010528564453125, -0.9505462646484375, -0.89056396484375, -0.8305816650390625, -0.770599365234375, -0.7106170654296875, -0.650634765625, -0.5906524658203125, -0.530670166015625, -0.4706878662109375, -0.41070556640625, -0.3507232666015625, -0.290740966796875, -0.2307586669921875, -0.1707763671875, -0.1107940673828125, -0.050811767578125, 0.0091705322265625, 0.06915283203125, 0.1291351318359375, 0.189117431640625, 0.2490997314453125, 0.30908203125, 0.3690643310546875, 0.429046630859375, 0.4890289306640625, 0.54901123046875, 0.6089935302734375, 0.668975830078125, 0.7289581298828125, 0.7889404296875, 0.8489227294921875, 0.908905029296875, 0.9688873291015625, 1.02886962890625, 1.0888519287109375, 1.148834228515625, 1.2088165283203125, 1.268798828125, 1.3287811279296875, 1.388763427734375, 1.4487457275390625, 1.50872802734375, 1.5687103271484375, 1.628692626953125, 1.6886749267578125, 1.7486572265625, 1.8086395263671875, 1.868621826171875, 1.9286041259765625, 1.98858642578125, 2.0485687255859375, 2.108551025390625, 2.1685333251953125, 2.228515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 10.0, 9.0, 8.0, 20.0, 21.0, 40.0, 64.0, 115.0, 148.0, 221.0, 394.0, 571.0, 866.0, 1230.0, 1871.0, 2716.0, 4013.0, 6053.0, 9267.0, 14453.0, 23339.0, 37949.0, 65605.0, 124167.0, 1323091.0, 225649.0, 105287.0, 56947.0, 33597.0, 20668.0, 13314.0, 8584.0, 5668.0, 3869.0, 2463.0, 1683.0, 1094.0, 737.0, 458.0, 287.0, 209.0, 122.0, 93.0, 57.0, 41.0, 17.0, 14.0, 17.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.49267578125, -0.475616455078125, -0.45855712890625, -0.441497802734375, -0.4244384765625, -0.407379150390625, -0.39031982421875, -0.373260498046875, -0.356201171875, -0.339141845703125, -0.32208251953125, -0.305023193359375, -0.2879638671875, -0.270904541015625, -0.25384521484375, -0.236785888671875, -0.2197265625, -0.202667236328125, -0.18560791015625, -0.168548583984375, -0.1514892578125, -0.134429931640625, -0.11737060546875, -0.100311279296875, -0.083251953125, -0.066192626953125, -0.04913330078125, -0.032073974609375, -0.0150146484375, 0.002044677734375, 0.01910400390625, 0.036163330078125, 0.05322265625, 0.070281982421875, 0.08734130859375, 0.104400634765625, 0.1214599609375, 0.138519287109375, 0.15557861328125, 0.172637939453125, 0.189697265625, 0.206756591796875, 0.22381591796875, 0.240875244140625, 0.2579345703125, 0.274993896484375, 0.29205322265625, 0.309112548828125, 0.326171875, 0.343231201171875, 0.36029052734375, 0.377349853515625, 0.3944091796875, 0.411468505859375, 0.42852783203125, 0.445587158203125, 0.462646484375, 0.479705810546875, 0.49676513671875, 0.513824462890625, 0.5308837890625, 0.547943115234375, 0.56500244140625, 0.582061767578125, 0.59912109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 10.0, 8.0, 17.0, 21.0, 22.0, 17.0, 32.0, 37.0, 37.0, 34.0, 45.0, 48.0, 55.0, 50.0, 57.0, 46.0, 57.0, 55.0, 41.0, 38.0, 46.0, 31.0, 31.0, 39.0, 19.0, 13.0, 16.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000232696533203125, -0.0002246946096420288, -0.00021669268608093262, -0.00020869076251983643, -0.00020068883895874023, -0.00019268691539764404, -0.00018468499183654785, -0.00017668306827545166, -0.00016868114471435547, -0.00016067922115325928, -0.00015267729759216309, -0.0001446753740310669, -0.0001366734504699707, -0.0001286715269088745, -0.00012066960334777832, -0.00011266767978668213, -0.00010466575622558594, -9.666383266448975e-05, -8.866190910339355e-05, -8.065998554229736e-05, -7.265806198120117e-05, -6.465613842010498e-05, -5.665421485900879e-05, -4.86522912979126e-05, -4.0650367736816406e-05, -3.2648444175720215e-05, -2.4646520614624023e-05, -1.6644597053527832e-05, -8.64267349243164e-06, -6.407499313354492e-07, 7.361173629760742e-06, 1.5363097190856934e-05, 2.3365020751953125e-05, 3.1366944313049316e-05, 3.936886787414551e-05, 4.73707914352417e-05, 5.537271499633789e-05, 6.337463855743408e-05, 7.137656211853027e-05, 7.937848567962646e-05, 8.738040924072266e-05, 9.538233280181885e-05, 0.00010338425636291504, 0.00011138617992401123, 0.00011938810348510742, 0.0001273900270462036, 0.0001353919506072998, 0.000143393874168396, 0.0001513957977294922, 0.00015939772129058838, 0.00016739964485168457, 0.00017540156841278076, 0.00018340349197387695, 0.00019140541553497314, 0.00019940733909606934, 0.00020740926265716553, 0.00021541118621826172, 0.0002234131097793579, 0.0002314150333404541, 0.0002394169569015503, 0.0002474188804626465, 0.0002554208040237427, 0.00026342272758483887, 0.00027142465114593506, 0.00027942657470703125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 15.0, 19.0, 23.0, 25.0, 45.0, 51.0, 59.0, 76.0, 92.0, 125.0, 254.0, 513.0, 1477.0, 415731.0, 626699.0, 1806.0, 572.0, 271.0, 173.0, 110.0, 77.0, 61.0, 45.0, 51.0, 30.0, 29.0, 27.0, 14.0, 13.0, 9.0, 6.0, 11.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.006122589111328125, -0.005952715873718262, -0.0057828426361083984, -0.005612969398498535, -0.005443096160888672, -0.005273222923278809, -0.005103349685668945, -0.004933476448059082, -0.004763603210449219, -0.0045937299728393555, -0.004423856735229492, -0.004253983497619629, -0.004084110260009766, -0.003914237022399902, -0.003744363784790039, -0.0035744905471801758, -0.0034046173095703125, -0.0032347440719604492, -0.003064870834350586, -0.0028949975967407227, -0.0027251243591308594, -0.002555251121520996, -0.002385377883911133, -0.0022155046463012695, -0.0020456314086914062, -0.001875758171081543, -0.0017058849334716797, -0.0015360116958618164, -0.0013661384582519531, -0.0011962652206420898, -0.0010263919830322266, -0.0008565187454223633, -0.0006866455078125, -0.0005167722702026367, -0.00034689903259277344, -0.00017702579498291016, -7.152557373046875e-06, 0.0001627206802368164, 0.0003325939178466797, 0.000502467155456543, 0.0006723403930664062, 0.0008422136306762695, 0.0010120868682861328, 0.001181960105895996, 0.0013518333435058594, 0.0015217065811157227, 0.001691579818725586, 0.0018614530563354492, 0.0020313262939453125, 0.0022011995315551758, 0.002371072769165039, 0.0025409460067749023, 0.0027108192443847656, 0.002880692481994629, 0.003050565719604492, 0.0032204389572143555, 0.0033903121948242188, 0.003560185432434082, 0.0037300586700439453, 0.0038999319076538086, 0.004069805145263672, 0.004239678382873535, 0.0044095516204833984, 0.004579424858093262, 0.004749298095703125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 19.0, 28.0, 34.0, 76.0, 120.0, 126.0, 130.0, 133.0, 127.0, 81.0, 49.0, 41.0, 14.0, 13.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00014169173664413393, -0.00013415678404271603, -0.00012662183144129813, -0.00011908687883988023, -0.00011155191896250471, -0.00010401696636108682, -9.648201375966892e-05, -8.89470538822934e-05, -8.14121012808755e-05, -7.38771486794576e-05, -6.63421960780397e-05, -5.8807239838643e-05, -5.127228359924629e-05, -4.3737330997828394e-05, -3.6202378396410495e-05, -2.866742215701379e-05, -2.1132473193574697e-05, -1.3597518773167394e-05, -6.062565262254793e-06, 1.4723882486578077e-06, 9.00734266906511e-06, 1.6542297089472413e-05, 2.4077249690890312e-05, 3.161220593028702e-05, 3.914715853170492e-05, 4.668211113312282e-05, 5.421706737251952e-05, 6.175201997393742e-05, 6.928697257535532e-05, 7.682193245273083e-05, 8.435688505414873e-05, 9.189183765556663e-05, 9.942679025698453e-05, 0.00010696174285840243, 0.00011449669545982033, 0.00012203164806123823, 0.00012956660066265613, 0.00013710156781598926, 0.00014463652041740716, 0.00015217147301882505, 0.00015970642562024295, 0.00016724137822166085, 0.00017477633082307875, 0.00018231128342449665, 0.00018984623602591455, 0.00019738118862733245, 0.00020491614122875035, 0.00021245110838208348, 0.00021998604643158615, 0.00022752099903300405, 0.00023505595163442194, 0.00024259090423583984, 0.00025012585683725774, 0.00025766080943867564, 0.00026519576204009354, 0.00027273071464151144, 0.0002802656963467598, 0.0002878006489481777, 0.0002953356015495956, 0.0003028705541510135, 0.0003104055067524314, 0.0003179404593538493, 0.0003254754119552672, 0.0003330103645566851, 0.000340545317158103]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 7.0, 4.0, 2.0, 5.0, 11.0, 15.0, 11.0, 19.0, 10.0, 24.0, 31.0, 47.0, 23.0, 30.0, 33.0, 40.0, 39.0, 39.0, 39.0, 42.0, 38.0, 42.0, 37.0, 39.0, 41.0, 33.0, 35.0, 30.0, 28.0, 33.0, 29.0, 16.0, 19.0, 23.0, 19.0, 13.0, 14.0, 8.0, 5.0, 10.0, 2.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00014823675155639648, -0.0001438213512301445, -0.00013940595090389252, -0.00013499055057764053, -0.00013057515025138855, -0.00012615974992513657, -0.00012174434959888458, -0.0001173289492726326, -0.00011291354894638062, -0.00010849814862012863, -0.00010408274829387665, -9.966734796762466e-05, -9.525194764137268e-05, -9.08365473151207e-05, -8.642114698886871e-05, -8.200574666261673e-05, -7.759034633636475e-05, -7.317494601011276e-05, -6.875954568386078e-05, -6.43441453576088e-05, -5.992874503135681e-05, -5.551334470510483e-05, -5.1097944378852844e-05, -4.668254405260086e-05, -4.226714372634888e-05, -3.785174340009689e-05, -3.343634307384491e-05, -2.9020942747592926e-05, -2.4605542421340942e-05, -2.019014209508896e-05, -1.5774741768836975e-05, -1.1359341442584991e-05, -6.943941116333008e-06, -2.528540790081024e-06, 1.8868595361709595e-06, 6.302259862422943e-06, 1.0717660188674927e-05, 1.513306051492691e-05, 1.9548460841178894e-05, 2.3963861167430878e-05, 2.837926149368286e-05, 3.2794661819934845e-05, 3.721006214618683e-05, 4.162546247243881e-05, 4.6040862798690796e-05, 5.045626312494278e-05, 5.487166345119476e-05, 5.928706377744675e-05, 6.370246410369873e-05, 6.811786442995071e-05, 7.25332647562027e-05, 7.694866508245468e-05, 8.136406540870667e-05, 8.577946573495865e-05, 9.019486606121063e-05, 9.461026638746262e-05, 9.90256667137146e-05, 0.00010344106703996658, 0.00010785646736621857, 0.00011227186769247055, 0.00011668726801872253, 0.00012110266834497452, 0.0001255180686712265, 0.00012993346899747849, 0.00013434886932373047]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 11.0, 11.0, 16.0, 20.0, 26.0, 21.0, 22.0, 26.0, 22.0, 35.0, 29.0, 31.0, 33.0, 43.0, 32.0, 47.0, 44.0, 41.0, 43.0, 38.0, 41.0, 37.0, 37.0, 31.0, 26.0, 25.0, 25.0, 24.0, 14.0, 23.0, 23.0, 22.0, 7.0, 7.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.892425537109375, -2.79852294921875, -2.704620361328125, -2.6107177734375, -2.516815185546875, -2.42291259765625, -2.329010009765625, -2.235107421875, -2.141204833984375, -2.04730224609375, -1.953399658203125, -1.8594970703125, -1.765594482421875, -1.67169189453125, -1.577789306640625, -1.48388671875, -1.389984130859375, -1.29608154296875, -1.202178955078125, -1.1082763671875, -1.014373779296875, -0.92047119140625, -0.826568603515625, -0.732666015625, -0.638763427734375, -0.54486083984375, -0.450958251953125, -0.3570556640625, -0.263153076171875, -0.16925048828125, -0.075347900390625, 0.0185546875, 0.112457275390625, 0.20635986328125, 0.300262451171875, 0.3941650390625, 0.488067626953125, 0.58197021484375, 0.675872802734375, 0.769775390625, 0.863677978515625, 0.95758056640625, 1.051483154296875, 1.1453857421875, 1.239288330078125, 1.33319091796875, 1.427093505859375, 1.52099609375, 1.614898681640625, 1.70880126953125, 1.802703857421875, 1.8966064453125, 1.990509033203125, 2.08441162109375, 2.178314208984375, 2.272216796875, 2.366119384765625, 2.46002197265625, 2.553924560546875, 2.6478271484375, 2.741729736328125, 2.83563232421875, 2.929534912109375, 3.0234375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 20.0, 23.0, 37.0, 56.0, 69.0, 112.0, 242.0, 452.0, 1027.0, 2129.0, 4464.0, 9401.0, 19415.0, 43619.0, 110736.0, 291262.0, 336562.0, 133614.0, 52083.0, 22587.0, 10619.0, 5173.0, 2425.0, 1115.0, 566.0, 280.0, 137.0, 81.0, 49.0, 38.0, 34.0, 26.0, 14.0, 11.0, 7.0, 6.0, 7.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.821014404296875, -2.72406005859375, -2.627105712890625, -2.5301513671875, -2.433197021484375, -2.33624267578125, -2.239288330078125, -2.142333984375, -2.045379638671875, -1.94842529296875, -1.851470947265625, -1.7545166015625, -1.657562255859375, -1.56060791015625, -1.463653564453125, -1.36669921875, -1.269744873046875, -1.17279052734375, -1.075836181640625, -0.9788818359375, -0.881927490234375, -0.78497314453125, -0.688018798828125, -0.591064453125, -0.494110107421875, -0.39715576171875, -0.300201416015625, -0.2032470703125, -0.106292724609375, -0.00933837890625, 0.087615966796875, 0.1845703125, 0.281524658203125, 0.37847900390625, 0.475433349609375, 0.5723876953125, 0.669342041015625, 0.76629638671875, 0.863250732421875, 0.960205078125, 1.057159423828125, 1.15411376953125, 1.251068115234375, 1.3480224609375, 1.444976806640625, 1.54193115234375, 1.638885498046875, 1.73583984375, 1.832794189453125, 1.92974853515625, 2.026702880859375, 2.1236572265625, 2.220611572265625, 2.31756591796875, 2.414520263671875, 2.511474609375, 2.608428955078125, 2.70538330078125, 2.802337646484375, 2.8992919921875, 2.996246337890625, 3.09320068359375, 3.190155029296875, 3.287109375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 9.0, 9.0, 12.0, 13.0, 13.0, 19.0, 33.0, 23.0, 35.0, 27.0, 34.0, 49.0, 51.0, 71.0, 150.0, 452.0, 1468.0, 146.0, 73.0, 52.0, 53.0, 42.0, 35.0, 29.0, 23.0, 16.0, 14.0, 23.0, 16.0, 10.0, 9.0, 3.0, 5.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -13.02001953125, -12.5712890625, -12.12255859375, -11.673828125, -11.22509765625, -10.7763671875, -10.32763671875, -9.87890625, -9.43017578125, -8.9814453125, -8.53271484375, -8.083984375, -7.63525390625, -7.1865234375, -6.73779296875, -6.2890625, -5.84033203125, -5.3916015625, -4.94287109375, -4.494140625, -4.04541015625, -3.5966796875, -3.14794921875, -2.69921875, -2.25048828125, -1.8017578125, -1.35302734375, -0.904296875, -0.45556640625, -0.0068359375, 0.44189453125, 0.890625, 1.33935546875, 1.7880859375, 2.23681640625, 2.685546875, 3.13427734375, 3.5830078125, 4.03173828125, 4.48046875, 4.92919921875, 5.3779296875, 5.82666015625, 6.275390625, 6.72412109375, 7.1728515625, 7.62158203125, 8.0703125, 8.51904296875, 8.9677734375, 9.41650390625, 9.865234375, 10.31396484375, 10.7626953125, 11.21142578125, 11.66015625, 12.10888671875, 12.5576171875, 13.00634765625, 13.455078125, 13.90380859375, 14.3525390625, 14.80126953125, 15.25]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 10.0, 7.0, 18.0, 16.0, 20.0, 26.0, 24.0, 40.0, 40.0, 40.0, 93.0, 127.0, 187.0, 325.0, 580.0, 2871.0, 3029789.0, 109090.0, 1086.0, 432.0, 261.0, 156.0, 120.0, 89.0, 56.0, 39.0, 34.0, 20.0, 28.0, 24.0, 11.0, 16.0, 9.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.90625, -37.6826171875, -36.458984375, -35.2353515625, -34.01171875, -32.7880859375, -31.564453125, -30.3408203125, -29.1171875, -27.8935546875, -26.669921875, -25.4462890625, -24.22265625, -22.9990234375, -21.775390625, -20.5517578125, -19.328125, -18.1044921875, -16.880859375, -15.6572265625, -14.43359375, -13.2099609375, -11.986328125, -10.7626953125, -9.5390625, -8.3154296875, -7.091796875, -5.8681640625, -4.64453125, -3.4208984375, -2.197265625, -0.9736328125, 0.25, 1.4736328125, 2.697265625, 3.9208984375, 5.14453125, 6.3681640625, 7.591796875, 8.8154296875, 10.0390625, 11.2626953125, 12.486328125, 13.7099609375, 14.93359375, 16.1572265625, 17.380859375, 18.6044921875, 19.828125, 21.0517578125, 22.275390625, 23.4990234375, 24.72265625, 25.9462890625, 27.169921875, 28.3935546875, 29.6171875, 30.8408203125, 32.064453125, 33.2880859375, 34.51171875, 35.7353515625, 36.958984375, 38.1826171875, 39.40625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 22.0, 148.0, 372.0, 331.0, 109.0, 20.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.757884979248047, -26.49295425415039, -25.228025436401367, -23.96309471130371, -22.698165893554688, -21.43323516845703, -20.168304443359375, -18.90337371826172, -17.638444900512695, -16.37351417541504, -15.108585357666016, -13.84365463256836, -12.57872486114502, -11.31379508972168, -10.048864364624023, -8.783934593200684, -7.519004821777344, -6.254075050354004, -4.989144802093506, -3.724214792251587, -2.459284782409668, -1.1943550109863281, 0.07057523727416992, 1.335505485534668, 2.600435256958008, 3.8653652667999268, 5.130295276641846, 6.395225524902344, 7.660155296325684, 8.925085067749023, 10.19001579284668, 11.45494556427002, 12.719871520996094, 13.984801292419434, 15.249731063842773, 16.51466178894043, 17.779590606689453, 19.04452133178711, 20.309452056884766, 21.574382781982422, 22.839311599731445, 24.1042423248291, 25.369171142578125, 26.63410186767578, 27.899032592773438, 29.16396141052246, 30.428892135620117, 31.69382095336914, 32.9587516784668, 34.22368240356445, 35.48861312866211, 36.7535400390625, 38.018470764160156, 39.28340148925781, 40.54833221435547, 41.813262939453125, 43.07819366455078, 44.34312438964844, 45.608055114746094, 46.872982025146484, 48.13791275024414, 49.4028434753418, 50.66777420043945, 51.93270492553711, 53.1976318359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 5.0, 6.0, 10.0, 10.0, 8.0, 17.0, 21.0, 17.0, 23.0, 25.0, 18.0, 22.0, 26.0, 40.0, 39.0, 32.0, 33.0, 36.0, 51.0, 24.0, 34.0, 50.0, 43.0, 39.0, 35.0, 42.0, 46.0, 34.0, 24.0, 27.0, 15.0, 26.0, 18.0, 16.0, 17.0, 5.0, 11.0, 16.0, 5.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.774852752685547, -27.903209686279297, -27.031564712524414, -26.159921646118164, -25.28827667236328, -24.41663360595703, -23.54499053955078, -22.67334747314453, -21.80170249938965, -20.9300594329834, -20.058414459228516, -19.186771392822266, -18.315128326416016, -17.443483352661133, -16.571840286254883, -15.700196266174316, -14.82855224609375, -13.956908226013184, -13.085264205932617, -12.213621139526367, -11.3419771194458, -10.470333099365234, -9.598690032958984, -8.727046012878418, -7.855401992797852, -6.983757972717285, -6.112114429473877, -5.240470886230469, -4.368826866149902, -3.497182846069336, -2.6255393028259277, -1.7538957595825195, -0.8822498321533203, -0.010606050491333008, 0.8610377311706543, 1.7326815128326416, 2.604325294494629, 3.4759693145751953, 4.3476128578186035, 5.219256401062012, 6.090900421142578, 6.9625444412231445, 7.834187984466553, 8.705831527709961, 9.577475547790527, 10.449119567871094, 11.320762634277344, 12.19240665435791, 13.064050674438477, 13.935694694519043, 14.80733871459961, 15.67898178100586, 16.55062484741211, 17.422269821166992, 18.293912887573242, 19.165557861328125, 20.037200927734375, 20.908843994140625, 21.780488967895508, 22.652132034301758, 23.52377700805664, 24.39542007446289, 25.26706314086914, 26.13870620727539, 27.010351181030273]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 11.0, 10.0, 17.0, 20.0, 25.0, 22.0, 25.0, 28.0, 32.0, 27.0, 40.0, 35.0, 42.0, 41.0, 37.0, 34.0, 47.0, 40.0, 38.0, 41.0, 51.0, 34.0, 32.0, 29.0, 42.0, 24.0, 21.0, 17.0, 20.0, 22.0, 13.0, 9.0, 9.0, 14.0, 1.0, 6.0, 6.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.33453369140625, -3.2237548828125, -3.11297607421875, -3.002197265625, -2.89141845703125, -2.7806396484375, -2.66986083984375, -2.55908203125, -2.44830322265625, -2.3375244140625, -2.22674560546875, -2.115966796875, -2.00518798828125, -1.8944091796875, -1.78363037109375, -1.6728515625, -1.56207275390625, -1.4512939453125, -1.34051513671875, -1.229736328125, -1.11895751953125, -1.0081787109375, -0.89739990234375, -0.78662109375, -0.67584228515625, -0.5650634765625, -0.45428466796875, -0.343505859375, -0.23272705078125, -0.1219482421875, -0.01116943359375, 0.099609375, 0.21038818359375, 0.3211669921875, 0.43194580078125, 0.542724609375, 0.65350341796875, 0.7642822265625, 0.87506103515625, 0.98583984375, 1.09661865234375, 1.2073974609375, 1.31817626953125, 1.428955078125, 1.53973388671875, 1.6505126953125, 1.76129150390625, 1.8720703125, 1.98284912109375, 2.0936279296875, 2.20440673828125, 2.315185546875, 2.42596435546875, 2.5367431640625, 2.64752197265625, 2.75830078125, 2.86907958984375, 2.9798583984375, 3.09063720703125, 3.201416015625, 3.31219482421875, 3.4229736328125, 3.53375244140625, 3.64453125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 5.0, 5.0, 9.0, 9.0, 18.0, 27.0, 25.0, 32.0, 34.0, 44.0, 64.0, 87.0, 102.0, 173.0, 315.0, 880.0, 4307.0, 141100.0, 2864240.0, 1155364.0, 24208.0, 1920.0, 498.0, 240.0, 142.0, 97.0, 63.0, 50.0, 48.0, 27.0, 36.0, 23.0, 22.0, 14.0, 13.0, 7.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.8680419921875, -9.525146484375, -9.1822509765625, -8.83935546875, -8.4964599609375, -8.153564453125, -7.8106689453125, -7.4677734375, -7.1248779296875, -6.781982421875, -6.4390869140625, -6.09619140625, -5.7532958984375, -5.410400390625, -5.0675048828125, -4.724609375, -4.3817138671875, -4.038818359375, -3.6959228515625, -3.35302734375, -3.0101318359375, -2.667236328125, -2.3243408203125, -1.9814453125, -1.6385498046875, -1.295654296875, -0.9527587890625, -0.60986328125, -0.2669677734375, 0.075927734375, 0.4188232421875, 0.76171875, 1.1046142578125, 1.447509765625, 1.7904052734375, 2.13330078125, 2.4761962890625, 2.819091796875, 3.1619873046875, 3.5048828125, 3.8477783203125, 4.190673828125, 4.5335693359375, 4.87646484375, 5.2193603515625, 5.562255859375, 5.9051513671875, 6.248046875, 6.5909423828125, 6.933837890625, 7.2767333984375, 7.61962890625, 7.9625244140625, 8.305419921875, 8.6483154296875, 8.9912109375, 9.3341064453125, 9.677001953125, 10.0198974609375, 10.36279296875, 10.7056884765625, 11.048583984375, 11.3914794921875, 11.734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 19.0, 15.0, 27.0, 34.0, 58.0, 82.0, 98.0, 180.0, 241.0, 323.0, 441.0, 500.0, 468.0, 431.0, 318.0, 225.0, 169.0, 120.0, 99.0, 42.0, 43.0, 32.0, 20.0, 18.0, 18.0, 7.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.10601806640625, -5.8800048828125, -5.65399169921875, -5.427978515625, -5.20196533203125, -4.9759521484375, -4.74993896484375, -4.52392578125, -4.29791259765625, -4.0718994140625, -3.84588623046875, -3.619873046875, -3.39385986328125, -3.1678466796875, -2.94183349609375, -2.7158203125, -2.48980712890625, -2.2637939453125, -2.03778076171875, -1.811767578125, -1.58575439453125, -1.3597412109375, -1.13372802734375, -0.90771484375, -0.68170166015625, -0.4556884765625, -0.22967529296875, -0.003662109375, 0.22235107421875, 0.4483642578125, 0.67437744140625, 0.900390625, 1.12640380859375, 1.3524169921875, 1.57843017578125, 1.804443359375, 2.03045654296875, 2.2564697265625, 2.48248291015625, 2.70849609375, 2.93450927734375, 3.1605224609375, 3.38653564453125, 3.612548828125, 3.83856201171875, 4.0645751953125, 4.29058837890625, 4.5166015625, 4.74261474609375, 4.9686279296875, 5.19464111328125, 5.420654296875, 5.64666748046875, 5.8726806640625, 6.09869384765625, 6.32470703125, 6.55072021484375, 6.7767333984375, 7.00274658203125, 7.228759765625, 7.45477294921875, 7.6807861328125, 7.90679931640625, 8.1328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 10.0, 15.0, 21.0, 32.0, 45.0, 56.0, 61.0, 144.0, 184.0, 257.0, 390.0, 725.0, 14677.0, 4105486.0, 69929.0, 907.0, 456.0, 271.0, 203.0, 124.0, 84.0, 61.0, 41.0, 15.0, 20.0, 17.0, 13.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.65625, -37.628173828125, -36.60009765625, -35.572021484375, -34.5439453125, -33.515869140625, -32.48779296875, -31.459716796875, -30.431640625, -29.403564453125, -28.37548828125, -27.347412109375, -26.3193359375, -25.291259765625, -24.26318359375, -23.235107421875, -22.20703125, -21.178955078125, -20.15087890625, -19.122802734375, -18.0947265625, -17.066650390625, -16.03857421875, -15.010498046875, -13.982421875, -12.954345703125, -11.92626953125, -10.898193359375, -9.8701171875, -8.842041015625, -7.81396484375, -6.785888671875, -5.7578125, -4.729736328125, -3.70166015625, -2.673583984375, -1.6455078125, -0.617431640625, 0.41064453125, 1.438720703125, 2.466796875, 3.494873046875, 4.52294921875, 5.551025390625, 6.5791015625, 7.607177734375, 8.63525390625, 9.663330078125, 10.69140625, 11.719482421875, 12.74755859375, 13.775634765625, 14.8037109375, 15.831787109375, 16.85986328125, 17.887939453125, 18.916015625, 19.944091796875, 20.97216796875, 22.000244140625, 23.0283203125, 24.056396484375, 25.08447265625, 26.112548828125, 27.140625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 91.0, 430.0, 411.0, 69.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.77948760986328, -23.382638931274414, -19.985790252685547, -16.58894157409668, -13.192092895507812, -9.795244216918945, -6.398395538330078, -3.001546859741211, 0.39530181884765625, 3.7921504974365234, 7.188999176025391, 10.585847854614258, 13.982696533203125, 17.379545211791992, 20.77639389038086, 24.173242568969727, 27.570091247558594, 30.96693992614746, 34.36378860473633, 37.76063537597656, 41.15748596191406, 44.55433654785156, 47.9511833190918, 51.34803009033203, 54.74488067626953, 58.14173126220703, 61.538578033447266, 64.9354248046875, 68.332275390625, 71.7291259765625, 75.1259765625, 78.52281951904297, 81.919677734375, 85.3165283203125, 88.71337890625, 92.11022186279297, 95.50707244873047, 98.90392303466797, 102.30076599121094, 105.69761657714844, 109.09446716308594, 112.49131774902344, 115.88816833496094, 119.2850112915039, 122.6818618774414, 126.0787124633789, 129.47555541992188, 132.87240600585938, 136.26925659179688, 139.66610717773438, 143.06295776367188, 146.45980834960938, 149.85665893554688, 153.2534942626953, 156.6503448486328, 160.0471954345703, 163.4440460205078, 166.8408966064453, 170.2377471923828, 173.6345977783203, 177.03143310546875, 180.42828369140625, 183.82513427734375, 187.22198486328125, 190.61883544921875]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 5.0, 11.0, 10.0, 7.0, 6.0, 13.0, 16.0, 11.0, 29.0, 19.0, 29.0, 40.0, 41.0, 31.0, 36.0, 43.0, 36.0, 51.0, 47.0, 49.0, 49.0, 36.0, 47.0, 49.0, 43.0, 28.0, 32.0, 41.0, 21.0, 26.0, 13.0, 18.0, 15.0, 10.0, 9.0, 11.0, 6.0, 0.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.824111938476562, -21.110454559326172, -20.39679527282715, -19.683137893676758, -18.969478607177734, -18.255821228027344, -17.542163848876953, -16.82850456237793, -16.114845275878906, -15.4011869430542, -14.687528610229492, -13.973871231079102, -13.260211944580078, -12.546554565429688, -11.83289623260498, -11.119237899780273, -10.405580520629883, -9.691922187805176, -8.978263854980469, -8.264606475830078, -7.550947666168213, -6.837289333343506, -6.123631477355957, -5.40997314453125, -4.696314811706543, -3.982656478881836, -3.268998384475708, -2.55534029006958, -1.841681957244873, -1.128023624420166, -0.4143657684326172, 0.29929256439208984, 1.0129528045654297, 1.7266110181808472, 2.4402692317962646, 3.1539273262023926, 3.8675856590270996, 4.581243991851807, 5.2949018478393555, 6.0085601806640625, 6.7222185134887695, 7.435876846313477, 8.149535179138184, 8.86319351196289, 9.576850891113281, 10.290510177612305, 11.004167556762695, 11.717825889587402, 12.43148422241211, 13.145142555236816, 13.858800888061523, 14.572458267211914, 15.286117553710938, 15.999774932861328, 16.71343231201172, 17.427091598510742, 18.140750885009766, 18.854408264160156, 19.56806755065918, 20.28172492980957, 20.995384216308594, 21.709041595458984, 22.422698974609375, 23.1363582611084, 23.85001564025879]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 12.0, 7.0, 11.0, 9.0, 13.0, 15.0, 19.0, 20.0, 25.0, 23.0, 32.0, 28.0, 24.0, 39.0, 39.0, 36.0, 32.0, 48.0, 40.0, 30.0, 45.0, 38.0, 29.0, 33.0, 30.0, 35.0, 26.0, 31.0, 32.0, 35.0, 24.0, 23.0, 14.0, 14.0, 11.0, 14.0, 5.0, 9.0, 8.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-3.298828125, -3.205657958984375, -3.11248779296875, -3.019317626953125, -2.9261474609375, -2.832977294921875, -2.73980712890625, -2.646636962890625, -2.553466796875, -2.460296630859375, -2.36712646484375, -2.273956298828125, -2.1807861328125, -2.087615966796875, -1.99444580078125, -1.901275634765625, -1.80810546875, -1.714935302734375, -1.62176513671875, -1.528594970703125, -1.4354248046875, -1.342254638671875, -1.24908447265625, -1.155914306640625, -1.062744140625, -0.969573974609375, -0.87640380859375, -0.783233642578125, -0.6900634765625, -0.596893310546875, -0.50372314453125, -0.410552978515625, -0.3173828125, -0.224212646484375, -0.13104248046875, -0.037872314453125, 0.0552978515625, 0.148468017578125, 0.24163818359375, 0.334808349609375, 0.427978515625, 0.521148681640625, 0.61431884765625, 0.707489013671875, 0.8006591796875, 0.893829345703125, 0.98699951171875, 1.080169677734375, 1.17333984375, 1.266510009765625, 1.35968017578125, 1.452850341796875, 1.5460205078125, 1.639190673828125, 1.73236083984375, 1.825531005859375, 1.918701171875, 2.011871337890625, 2.10504150390625, 2.198211669921875, 2.2913818359375, 2.384552001953125, 2.47772216796875, 2.570892333984375, 2.6640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 13.0, 19.0, 25.0, 33.0, 36.0, 65.0, 94.0, 157.0, 237.0, 318.0, 490.0, 707.0, 993.0, 1547.0, 2057.0, 2877.0, 4324.0, 6405.0, 9343.0, 13700.0, 20793.0, 32227.0, 50931.0, 84293.0, 154623.0, 264283.0, 160294.0, 87180.0, 51943.0, 33119.0, 21208.0, 13941.0, 9440.0, 6487.0, 4449.0, 3043.0, 2077.0, 1475.0, 991.0, 721.0, 531.0, 339.0, 213.0, 168.0, 122.0, 94.0, 58.0, 26.0, 22.0, 16.0, 7.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.479248046875, -0.4640464782714844, -0.44884490966796875, -0.4336433410644531, -0.4184417724609375, -0.4032402038574219, -0.38803863525390625, -0.3728370666503906, -0.357635498046875, -0.3424339294433594, -0.32723236083984375, -0.3120307922363281, -0.2968292236328125, -0.2816276550292969, -0.26642608642578125, -0.2512245178222656, -0.23602294921875, -0.22082138061523438, -0.20561981201171875, -0.19041824340820312, -0.1752166748046875, -0.16001510620117188, -0.14481353759765625, -0.12961196899414062, -0.114410400390625, -0.09920883178710938, -0.08400726318359375, -0.06880569458007812, -0.0536041259765625, -0.038402557373046875, -0.02320098876953125, -0.007999420166015625, 0.0072021484375, 0.022403717041015625, 0.03760528564453125, 0.052806854248046875, 0.0680084228515625, 0.08320999145507812, 0.09841156005859375, 0.11361312866210938, 0.128814697265625, 0.14401626586914062, 0.15921783447265625, 0.17441940307617188, 0.1896209716796875, 0.20482254028320312, 0.22002410888671875, 0.23522567749023438, 0.25042724609375, 0.2656288146972656, 0.28083038330078125, 0.2960319519042969, 0.3112335205078125, 0.3264350891113281, 0.34163665771484375, 0.3568382263183594, 0.372039794921875, 0.3872413635253906, 0.40244293212890625, 0.4176445007324219, 0.4328460693359375, 0.4480476379394531, 0.46324920654296875, 0.4784507751464844, 0.49365234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 9.0, 5.0, 9.0, 18.0, 9.0, 14.0, 13.0, 21.0, 16.0, 18.0, 24.0, 25.0, 35.0, 22.0, 31.0, 35.0, 34.0, 40.0, 31.0, 32.0, 1059.0, 38.0, 40.0, 36.0, 38.0, 40.0, 33.0, 26.0, 27.0, 28.0, 23.0, 17.0, 29.0, 18.0, 21.0, 15.0, 17.0, 11.0, 7.0, 4.0, 7.0, 11.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.7978515625, -1.74188232421875, -1.6859130859375, -1.62994384765625, -1.573974609375, -1.51800537109375, -1.4620361328125, -1.40606689453125, -1.35009765625, -1.29412841796875, -1.2381591796875, -1.18218994140625, -1.126220703125, -1.07025146484375, -1.0142822265625, -0.95831298828125, -0.90234375, -0.84637451171875, -0.7904052734375, -0.73443603515625, -0.678466796875, -0.62249755859375, -0.5665283203125, -0.51055908203125, -0.45458984375, -0.39862060546875, -0.3426513671875, -0.28668212890625, -0.230712890625, -0.17474365234375, -0.1187744140625, -0.06280517578125, -0.0068359375, 0.04913330078125, 0.1051025390625, 0.16107177734375, 0.217041015625, 0.27301025390625, 0.3289794921875, 0.38494873046875, 0.44091796875, 0.49688720703125, 0.5528564453125, 0.60882568359375, 0.664794921875, 0.72076416015625, 0.7767333984375, 0.83270263671875, 0.888671875, 0.94464111328125, 1.0006103515625, 1.05657958984375, 1.112548828125, 1.16851806640625, 1.2244873046875, 1.28045654296875, 1.33642578125, 1.39239501953125, 1.4483642578125, 1.50433349609375, 1.560302734375, 1.61627197265625, 1.6722412109375, 1.72821044921875, 1.7841796875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 9.0, 14.0, 32.0, 40.0, 69.0, 97.0, 133.0, 195.0, 312.0, 455.0, 614.0, 873.0, 1323.0, 1910.0, 2697.0, 3740.0, 5565.0, 8157.0, 12025.0, 18152.0, 27632.0, 43856.0, 72808.0, 131890.0, 1319190.0, 190860.0, 96179.0, 55855.0, 34280.0, 21985.0, 14690.0, 9678.0, 6725.0, 4602.0, 3167.0, 2222.0, 1574.0, 1082.0, 748.0, 529.0, 387.0, 243.0, 166.0, 117.0, 92.0, 52.0, 38.0, 21.0, 18.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.5166015625, -0.5008277893066406, -0.48505401611328125, -0.4692802429199219, -0.4535064697265625, -0.4377326965332031, -0.42195892333984375, -0.4061851501464844, -0.390411376953125, -0.3746376037597656, -0.35886383056640625, -0.3430900573730469, -0.3273162841796875, -0.3115425109863281, -0.29576873779296875, -0.2799949645996094, -0.26422119140625, -0.24844741821289062, -0.23267364501953125, -0.21689987182617188, -0.2011260986328125, -0.18535232543945312, -0.16957855224609375, -0.15380477905273438, -0.138031005859375, -0.12225723266601562, -0.10648345947265625, -0.09070968627929688, -0.0749359130859375, -0.059162139892578125, -0.04338836669921875, -0.027614593505859375, -0.0118408203125, 0.003932952880859375, 0.01970672607421875, 0.035480499267578125, 0.0512542724609375, 0.06702804565429688, 0.08280181884765625, 0.09857559204101562, 0.114349365234375, 0.13012313842773438, 0.14589691162109375, 0.16167068481445312, 0.1774444580078125, 0.19321823120117188, 0.20899200439453125, 0.22476577758789062, 0.24053955078125, 0.2563133239746094, 0.27208709716796875, 0.2878608703613281, 0.3036346435546875, 0.3194084167480469, 0.33518218994140625, 0.3509559631347656, 0.366729736328125, 0.3825035095214844, 0.39827728271484375, 0.4140510559082031, 0.4298248291015625, 0.4455986022949219, 0.46137237548828125, 0.4771461486816406, 0.492919921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 7.0, 9.0, 9.0, 13.0, 11.0, 15.0, 20.0, 22.0, 22.0, 38.0, 35.0, 43.0, 44.0, 61.0, 57.0, 56.0, 74.0, 61.0, 49.0, 56.0, 38.0, 49.0, 35.0, 23.0, 20.0, 23.0, 14.0, 15.0, 15.0, 5.0, 9.0, 10.0, 6.0, 4.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00033974647521972656, -0.0003298148512840271, -0.00031988322734832764, -0.0003099516034126282, -0.0003000199794769287, -0.00029008835554122925, -0.0002801567316055298, -0.0002702251076698303, -0.00026029348373413086, -0.0002503618597984314, -0.00024043023586273193, -0.00023049861192703247, -0.000220566987991333, -0.00021063536405563354, -0.00020070374011993408, -0.00019077211618423462, -0.00018084049224853516, -0.0001709088683128357, -0.00016097724437713623, -0.00015104562044143677, -0.0001411139965057373, -0.00013118237257003784, -0.00012125074863433838, -0.00011131912469863892, -0.00010138750076293945, -9.145587682723999e-05, -8.152425289154053e-05, -7.159262895584106e-05, -6.16610050201416e-05, -5.172938108444214e-05, -4.1797757148742676e-05, -3.186613321304321e-05, -2.193450927734375e-05, -1.2002885341644287e-05, -2.0712614059448242e-06, 7.860362529754639e-06, 1.77919864654541e-05, 2.7723610401153564e-05, 3.765523433685303e-05, 4.758685827255249e-05, 5.751848220825195e-05, 6.745010614395142e-05, 7.738173007965088e-05, 8.731335401535034e-05, 9.72449779510498e-05, 0.00010717660188674927, 0.00011710822582244873, 0.0001270398497581482, 0.00013697147369384766, 0.00014690309762954712, 0.00015683472156524658, 0.00016676634550094604, 0.0001766979694366455, 0.00018662959337234497, 0.00019656121730804443, 0.0002064928412437439, 0.00021642446517944336, 0.00022635608911514282, 0.00023628771305084229, 0.00024621933698654175, 0.0002561509609222412, 0.0002660825848579407, 0.00027601420879364014, 0.0002859458327293396, 0.00029587745666503906]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 8.0, 6.0, 4.0, 8.0, 9.0, 7.0, 9.0, 17.0, 23.0, 23.0, 27.0, 36.0, 58.0, 54.0, 76.0, 105.0, 194.0, 363.0, 779.0, 7791.0, 1031378.0, 5795.0, 742.0, 366.0, 185.0, 118.0, 76.0, 59.0, 44.0, 36.0, 30.0, 30.0, 20.0, 17.0, 12.0, 11.0, 8.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005908966064453125, -0.00570148229598999, -0.0054939985275268555, -0.005286514759063721, -0.005079030990600586, -0.004871547222137451, -0.004664063453674316, -0.004456579685211182, -0.004249095916748047, -0.004041612148284912, -0.0038341283798217773, -0.0036266446113586426, -0.003419160842895508, -0.003211677074432373, -0.0030041933059692383, -0.0027967095375061035, -0.0025892257690429688, -0.002381742000579834, -0.0021742582321166992, -0.0019667744636535645, -0.0017592906951904297, -0.001551806926727295, -0.0013443231582641602, -0.0011368393898010254, -0.0009293556213378906, -0.0007218718528747559, -0.0005143880844116211, -0.00030690431594848633, -9.942054748535156e-05, 0.0001080632209777832, 0.00031554698944091797, 0.0005230307579040527, 0.0007305145263671875, 0.0009379982948303223, 0.001145482063293457, 0.0013529658317565918, 0.0015604496002197266, 0.0017679333686828613, 0.001975417137145996, 0.002182900905609131, 0.0023903846740722656, 0.0025978684425354004, 0.002805352210998535, 0.00301283597946167, 0.0032203197479248047, 0.0034278035163879395, 0.0036352872848510742, 0.003842771053314209, 0.004050254821777344, 0.0042577385902404785, 0.004465222358703613, 0.004672706127166748, 0.004880189895629883, 0.005087673664093018, 0.005295157432556152, 0.005502641201019287, 0.005710124969482422, 0.005917608737945557, 0.006125092506408691, 0.006332576274871826, 0.006540060043334961, 0.006747543811798096, 0.0069550275802612305, 0.007162511348724365, 0.0073699951171875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 36.0, 127.0, 273.0, 281.0, 179.0, 78.0, 28.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006201037322171032, -0.000606104324106127, -0.0005921049742028117, -0.0005781055660918355, -0.0005641062161885202, -0.000550106808077544, -0.0005361074581742287, -0.0005221080500632524, -0.0005081087001599371, -0.0004941092920489609, -0.0004801099421456456, -0.00046611056313849986, -0.0004521111841313541, -0.0004381117760203779, -0.00042411242611706257, -0.00041011301800608635, -0.00039611360989511013, -0.00038211423088796437, -0.0003681148518808186, -0.00035411547287367284, -0.0003401160938665271, -0.00032611668575555086, -0.00031211733585223556, -0.00029811792774125934, -0.00028411857783794403, -0.00027011919883079827, -0.0002561198198236525, -0.00024212044081650674, -0.00022812104725744575, -0.0002141216682503, -0.00020012228924315423, -0.00018612289568409324, -0.00017212351667694747, -0.0001581241376698017, -0.00014412475866265595, -0.0001301253796555102, -0.0001161259860964492, -0.00010212660708930343, -8.812722808215767e-05, -7.41278417990543e-05, -6.012846279190853e-05, -4.612908014678396e-05, -3.212969750165939e-05, -1.813031849451363e-05, -4.130935849389061e-06, 9.868446795735508e-06, 2.386782580288127e-05, 3.786721208598465e-05, 5.186659109313041e-05, 6.586597010027617e-05, 7.986535638337955e-05, 9.386473539052531e-05, 0.00010786412167362869, 0.00012186350068077445, 0.0001358628796879202, 0.00014986225869506598, 0.00016386163770221174, 0.0001778610167093575, 0.00019186039571650326, 0.00020585977472364902, 0.00021985916828271002, 0.00023385854728985578, 0.00024785794084891677, 0.00026185731985606253, 0.0002758566988632083]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 9.0, 17.0, 13.0, 14.0, 9.0, 17.0, 18.0, 23.0, 25.0, 20.0, 32.0, 19.0, 30.0, 41.0, 44.0, 37.0, 36.0, 50.0, 44.0, 33.0, 39.0, 35.0, 36.0, 43.0, 36.0, 29.0, 24.0, 29.0, 30.0, 22.0, 29.0, 18.0, 14.0, 16.0, 19.0, 15.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014156103134155273, -0.0001367218792438507, -0.00013188272714614868, -0.00012704357504844666, -0.00012220442295074463, -0.0001173652708530426, -0.00011252611875534058, -0.00010768696665763855, -0.00010284781455993652, -9.80086624622345e-05, -9.316951036453247e-05, -8.833035826683044e-05, -8.349120616912842e-05, -7.865205407142639e-05, -7.381290197372437e-05, -6.897374987602234e-05, -6.413459777832031e-05, -5.9295445680618286e-05, -5.445629358291626e-05, -4.9617141485214233e-05, -4.477798938751221e-05, -3.993883728981018e-05, -3.5099685192108154e-05, -3.0260533094406128e-05, -2.54213809967041e-05, -2.0582228899002075e-05, -1.574307680130005e-05, -1.0903924703598022e-05, -6.064772605895996e-06, -1.2256205081939697e-06, 3.6135315895080566e-06, 8.452683687210083e-06, 1.329183578491211e-05, 1.8130987882614136e-05, 2.2970139980316162e-05, 2.780929207801819e-05, 3.2648444175720215e-05, 3.748759627342224e-05, 4.232674837112427e-05, 4.7165900468826294e-05, 5.200505256652832e-05, 5.684420466423035e-05, 6.168335676193237e-05, 6.65225088596344e-05, 7.136166095733643e-05, 7.620081305503845e-05, 8.103996515274048e-05, 8.58791172504425e-05, 9.071826934814453e-05, 9.555742144584656e-05, 0.00010039657354354858, 0.00010523572564125061, 0.00011007487773895264, 0.00011491402983665466, 0.00011975318193435669, 0.00012459233403205872, 0.00012943148612976074, 0.00013427063822746277, 0.0001391097903251648, 0.00014394894242286682, 0.00014878809452056885, 0.00015362724661827087, 0.0001584663987159729, 0.00016330555081367493, 0.00016814470291137695]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 12.0, 7.0, 11.0, 9.0, 13.0, 15.0, 19.0, 20.0, 25.0, 23.0, 32.0, 28.0, 24.0, 39.0, 39.0, 36.0, 32.0, 48.0, 40.0, 30.0, 45.0, 38.0, 29.0, 33.0, 30.0, 35.0, 26.0, 31.0, 32.0, 35.0, 24.0, 23.0, 14.0, 14.0, 11.0, 14.0, 5.0, 9.0, 8.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-3.298828125, -3.205657958984375, -3.11248779296875, -3.019317626953125, -2.9261474609375, -2.832977294921875, -2.73980712890625, -2.646636962890625, -2.553466796875, -2.460296630859375, -2.36712646484375, -2.273956298828125, -2.1807861328125, -2.087615966796875, -1.99444580078125, -1.901275634765625, -1.80810546875, -1.714935302734375, -1.62176513671875, -1.528594970703125, -1.4354248046875, -1.342254638671875, -1.24908447265625, -1.155914306640625, -1.062744140625, -0.969573974609375, -0.87640380859375, -0.783233642578125, -0.6900634765625, -0.596893310546875, -0.50372314453125, -0.410552978515625, -0.3173828125, -0.224212646484375, -0.13104248046875, -0.037872314453125, 0.0552978515625, 0.148468017578125, 0.24163818359375, 0.334808349609375, 0.427978515625, 0.521148681640625, 0.61431884765625, 0.707489013671875, 0.8006591796875, 0.893829345703125, 0.98699951171875, 1.080169677734375, 1.17333984375, 1.266510009765625, 1.35968017578125, 1.452850341796875, 1.5460205078125, 1.639190673828125, 1.73236083984375, 1.825531005859375, 1.918701171875, 2.011871337890625, 2.10504150390625, 2.198211669921875, 2.2913818359375, 2.384552001953125, 2.47772216796875, 2.570892333984375, 2.6640625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 7.0, 20.0, 14.0, 24.0, 29.0, 30.0, 39.0, 58.0, 80.0, 112.0, 142.0, 273.0, 495.0, 1010.0, 2377.0, 5800.0, 14689.0, 36508.0, 86675.0, 198967.0, 367400.0, 191269.0, 83299.0, 34925.0, 14155.0, 5571.0, 2280.0, 972.0, 476.0, 231.0, 168.0, 92.0, 72.0, 57.0, 57.0, 28.0, 30.0, 26.0, 21.0, 14.0, 15.0, 7.0, 10.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0], "bins": [-3.607421875, -3.5057373046875, -3.404052734375, -3.3023681640625, -3.20068359375, -3.0989990234375, -2.997314453125, -2.8956298828125, -2.7939453125, -2.6922607421875, -2.590576171875, -2.4888916015625, -2.38720703125, -2.2855224609375, -2.183837890625, -2.0821533203125, -1.98046875, -1.8787841796875, -1.777099609375, -1.6754150390625, -1.57373046875, -1.4720458984375, -1.370361328125, -1.2686767578125, -1.1669921875, -1.0653076171875, -0.963623046875, -0.8619384765625, -0.76025390625, -0.6585693359375, -0.556884765625, -0.4552001953125, -0.353515625, -0.2518310546875, -0.150146484375, -0.0484619140625, 0.05322265625, 0.1549072265625, 0.256591796875, 0.3582763671875, 0.4599609375, 0.5616455078125, 0.663330078125, 0.7650146484375, 0.86669921875, 0.9683837890625, 1.070068359375, 1.1717529296875, 1.2734375, 1.3751220703125, 1.476806640625, 1.5784912109375, 1.68017578125, 1.7818603515625, 1.883544921875, 1.9852294921875, 2.0869140625, 2.1885986328125, 2.290283203125, 2.3919677734375, 2.49365234375, 2.5953369140625, 2.697021484375, 2.7987060546875, 2.900390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 8.0, 6.0, 16.0, 10.0, 14.0, 16.0, 22.0, 31.0, 19.0, 28.0, 40.0, 28.0, 35.0, 43.0, 59.0, 73.0, 148.0, 351.0, 1455.0, 164.0, 83.0, 47.0, 36.0, 34.0, 38.0, 29.0, 30.0, 19.0, 30.0, 23.0, 22.0, 17.0, 10.0, 12.0, 11.0, 6.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7275390625, -9.392578125, -9.0576171875, -8.72265625, -8.3876953125, -8.052734375, -7.7177734375, -7.3828125, -7.0478515625, -6.712890625, -6.3779296875, -6.04296875, -5.7080078125, -5.373046875, -5.0380859375, -4.703125, -4.3681640625, -4.033203125, -3.6982421875, -3.36328125, -3.0283203125, -2.693359375, -2.3583984375, -2.0234375, -1.6884765625, -1.353515625, -1.0185546875, -0.68359375, -0.3486328125, -0.013671875, 0.3212890625, 0.65625, 0.9912109375, 1.326171875, 1.6611328125, 1.99609375, 2.3310546875, 2.666015625, 3.0009765625, 3.3359375, 3.6708984375, 4.005859375, 4.3408203125, 4.67578125, 5.0107421875, 5.345703125, 5.6806640625, 6.015625, 6.3505859375, 6.685546875, 7.0205078125, 7.35546875, 7.6904296875, 8.025390625, 8.3603515625, 8.6953125, 9.0302734375, 9.365234375, 9.7001953125, 10.03515625, 10.3701171875, 10.705078125, 11.0400390625, 11.375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 7.0, 6.0, 11.0, 11.0, 19.0, 13.0, 17.0, 27.0, 32.0, 54.0, 80.0, 116.0, 180.0, 280.0, 611.0, 1715.0, 528739.0, 2609977.0, 2233.0, 634.0, 319.0, 162.0, 116.0, 79.0, 60.0, 48.0, 32.0, 19.0, 22.0, 12.0, 15.0, 9.0, 8.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.1875, -39.8173828125, -38.447265625, -37.0771484375, -35.70703125, -34.3369140625, -32.966796875, -31.5966796875, -30.2265625, -28.8564453125, -27.486328125, -26.1162109375, -24.74609375, -23.3759765625, -22.005859375, -20.6357421875, -19.265625, -17.8955078125, -16.525390625, -15.1552734375, -13.78515625, -12.4150390625, -11.044921875, -9.6748046875, -8.3046875, -6.9345703125, -5.564453125, -4.1943359375, -2.82421875, -1.4541015625, -0.083984375, 1.2861328125, 2.65625, 4.0263671875, 5.396484375, 6.7666015625, 8.13671875, 9.5068359375, 10.876953125, 12.2470703125, 13.6171875, 14.9873046875, 16.357421875, 17.7275390625, 19.09765625, 20.4677734375, 21.837890625, 23.2080078125, 24.578125, 25.9482421875, 27.318359375, 28.6884765625, 30.05859375, 31.4287109375, 32.798828125, 34.1689453125, 35.5390625, 36.9091796875, 38.279296875, 39.6494140625, 41.01953125, 42.3896484375, 43.759765625, 45.1298828125, 46.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 27.0, 153.0, 347.0, 315.0, 141.0, 22.0, 2.0, 2.0, 0.0, 1.0], "bins": [-69.21880340576172, -68.00346374511719, -66.78813171386719, -65.57279205322266, -64.35745239257812, -63.14211654663086, -61.926780700683594, -60.71144104003906, -59.4961051940918, -58.28076934814453, -57.0654296875, -55.850093841552734, -54.63475799560547, -53.41941833496094, -52.20408248901367, -50.988746643066406, -49.773406982421875, -48.55807113647461, -47.34273147583008, -46.12739562988281, -44.91205596923828, -43.696720123291016, -42.48138427734375, -41.26604461669922, -40.05070877075195, -38.83537292480469, -37.620033264160156, -36.40469741821289, -35.189361572265625, -33.974021911621094, -32.75868606567383, -31.54334831237793, -30.32801055908203, -29.112672805786133, -27.897335052490234, -26.68199920654297, -25.46666145324707, -24.251323699951172, -23.035987854003906, -21.820650100708008, -20.60531234741211, -19.38997459411621, -18.174636840820312, -16.959300994873047, -15.743963241577148, -14.52862548828125, -13.313288688659668, -12.097951889038086, -10.882614135742188, -9.667276382446289, -8.451939582824707, -7.236602306365967, -6.021265029907227, -4.805927753448486, -3.590590476989746, -2.375253677368164, -1.1599159240722656, 0.05542135238647461, 1.2707586288452148, 2.486095905303955, 3.7014331817626953, 4.9167704582214355, 6.132107734680176, 7.347444534301758, 8.562782287597656]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 17.0, 23.0, 19.0, 25.0, 19.0, 31.0, 24.0, 35.0, 29.0, 37.0, 26.0, 40.0, 41.0, 38.0, 44.0, 35.0, 40.0, 41.0, 25.0, 33.0, 34.0, 31.0, 20.0, 32.0, 20.0, 27.0, 26.0, 21.0, 16.0, 15.0, 21.0, 6.0, 12.0, 7.0, 7.0, 6.0, 9.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.22670555114746, -20.48387336730957, -19.741043090820312, -18.998210906982422, -18.25537872314453, -17.512548446655273, -16.769716262817383, -16.026885986328125, -15.284053802490234, -14.54122257232666, -13.798391342163086, -13.055559158325195, -12.312727928161621, -11.569896697998047, -10.827064514160156, -10.084233283996582, -9.341402053833008, -8.598570823669434, -7.855739116668701, -7.112907409667969, -6.3700761795043945, -5.62724494934082, -4.884413242340088, -4.1415815353393555, -3.3987503051757812, -2.655918836593628, -1.9130873680114746, -1.1702558994293213, -0.42742443084716797, 0.31540703773498535, 1.0582385063171387, 1.801070213317871, 2.543903350830078, 3.2867348194122314, 4.029566287994385, 4.772397994995117, 5.515229225158691, 6.258060455322266, 7.000892162322998, 7.7437238693237305, 8.486555099487305, 9.229386329650879, 9.972217559814453, 10.715049743652344, 11.457880973815918, 12.200712203979492, 12.943544387817383, 13.686375617980957, 14.429206848144531, 15.172038078308105, 15.91486930847168, 16.65770149230957, 17.400531768798828, 18.14336395263672, 18.88619613647461, 19.6290283203125, 20.371858596801758, 21.11469078063965, 21.857521057128906, 22.600353240966797, 23.343185424804688, 24.086015701293945, 24.828847885131836, 25.571678161621094, 26.314510345458984]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 3.0, 8.0, 8.0, 13.0, 12.0, 11.0, 15.0, 24.0, 16.0, 28.0, 22.0, 24.0, 26.0, 31.0, 31.0, 31.0, 25.0, 40.0, 55.0, 43.0, 41.0, 31.0, 30.0, 35.0, 33.0, 37.0, 23.0, 30.0, 28.0, 26.0, 31.0, 23.0, 22.0, 19.0, 20.0, 21.0, 15.0, 19.0, 9.0, 5.0, 9.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.47265625, -3.370147705078125, -3.26763916015625, -3.165130615234375, -3.0626220703125, -2.960113525390625, -2.85760498046875, -2.755096435546875, -2.652587890625, -2.550079345703125, -2.44757080078125, -2.345062255859375, -2.2425537109375, -2.140045166015625, -2.03753662109375, -1.935028076171875, -1.83251953125, -1.730010986328125, -1.62750244140625, -1.524993896484375, -1.4224853515625, -1.319976806640625, -1.21746826171875, -1.114959716796875, -1.012451171875, -0.909942626953125, -0.80743408203125, -0.704925537109375, -0.6024169921875, -0.499908447265625, -0.39739990234375, -0.294891357421875, -0.1923828125, -0.089874267578125, 0.01263427734375, 0.115142822265625, 0.2176513671875, 0.320159912109375, 0.42266845703125, 0.525177001953125, 0.627685546875, 0.730194091796875, 0.83270263671875, 0.935211181640625, 1.0377197265625, 1.140228271484375, 1.24273681640625, 1.345245361328125, 1.44775390625, 1.550262451171875, 1.65277099609375, 1.755279541015625, 1.8577880859375, 1.960296630859375, 2.06280517578125, 2.165313720703125, 2.267822265625, 2.370330810546875, 2.47283935546875, 2.575347900390625, 2.6778564453125, 2.780364990234375, 2.88287353515625, 2.985382080078125, 3.087890625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 4.0, 8.0, 10.0, 18.0, 23.0, 19.0, 27.0, 26.0, 36.0, 45.0, 55.0, 54.0, 93.0, 103.0, 139.0, 204.0, 432.0, 1782.0, 32566.0, 1352374.0, 2666509.0, 133785.0, 4243.0, 699.0, 246.0, 134.0, 122.0, 99.0, 75.0, 56.0, 46.0, 45.0, 31.0, 29.0, 24.0, 26.0, 18.0, 17.0, 7.0, 10.0, 10.0, 0.0, 4.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0], "bins": [-11.296875, -10.96630859375, -10.6357421875, -10.30517578125, -9.974609375, -9.64404296875, -9.3134765625, -8.98291015625, -8.65234375, -8.32177734375, -7.9912109375, -7.66064453125, -7.330078125, -6.99951171875, -6.6689453125, -6.33837890625, -6.0078125, -5.67724609375, -5.3466796875, -5.01611328125, -4.685546875, -4.35498046875, -4.0244140625, -3.69384765625, -3.36328125, -3.03271484375, -2.7021484375, -2.37158203125, -2.041015625, -1.71044921875, -1.3798828125, -1.04931640625, -0.71875, -0.38818359375, -0.0576171875, 0.27294921875, 0.603515625, 0.93408203125, 1.2646484375, 1.59521484375, 1.92578125, 2.25634765625, 2.5869140625, 2.91748046875, 3.248046875, 3.57861328125, 3.9091796875, 4.23974609375, 4.5703125, 4.90087890625, 5.2314453125, 5.56201171875, 5.892578125, 6.22314453125, 6.5537109375, 6.88427734375, 7.21484375, 7.54541015625, 7.8759765625, 8.20654296875, 8.537109375, 8.86767578125, 9.1982421875, 9.52880859375, 9.859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 10.0, 13.0, 10.0, 14.0, 17.0, 22.0, 28.0, 28.0, 48.0, 72.0, 78.0, 122.0, 137.0, 198.0, 286.0, 381.0, 447.0, 459.0, 419.0, 341.0, 240.0, 185.0, 140.0, 97.0, 62.0, 53.0, 46.0, 27.0, 21.0, 20.0, 13.0, 12.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.5909423828125, -6.392822265625, -6.1947021484375, -5.99658203125, -5.7984619140625, -5.600341796875, -5.4022216796875, -5.2041015625, -5.0059814453125, -4.807861328125, -4.6097412109375, -4.41162109375, -4.2135009765625, -4.015380859375, -3.8172607421875, -3.619140625, -3.4210205078125, -3.222900390625, -3.0247802734375, -2.82666015625, -2.6285400390625, -2.430419921875, -2.2322998046875, -2.0341796875, -1.8360595703125, -1.637939453125, -1.4398193359375, -1.24169921875, -1.0435791015625, -0.845458984375, -0.6473388671875, -0.44921875, -0.2510986328125, -0.052978515625, 0.1451416015625, 0.34326171875, 0.5413818359375, 0.739501953125, 0.9376220703125, 1.1357421875, 1.3338623046875, 1.531982421875, 1.7301025390625, 1.92822265625, 2.1263427734375, 2.324462890625, 2.5225830078125, 2.720703125, 2.9188232421875, 3.116943359375, 3.3150634765625, 3.51318359375, 3.7113037109375, 3.909423828125, 4.1075439453125, 4.3056640625, 4.5037841796875, 4.701904296875, 4.9000244140625, 5.09814453125, 5.2962646484375, 5.494384765625, 5.6925048828125, 5.890625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 4.0, 8.0, 15.0, 15.0, 18.0, 28.0, 37.0, 40.0, 71.0, 87.0, 124.0, 191.0, 277.0, 402.0, 667.0, 13883.0, 4068152.0, 107829.0, 956.0, 406.0, 279.0, 209.0, 144.0, 116.0, 81.0, 54.0, 42.0, 31.0, 25.0, 16.0, 18.0, 10.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.875, -28.8671875, -27.859375, -26.8515625, -25.84375, -24.8359375, -23.828125, -22.8203125, -21.8125, -20.8046875, -19.796875, -18.7890625, -17.78125, -16.7734375, -15.765625, -14.7578125, -13.75, -12.7421875, -11.734375, -10.7265625, -9.71875, -8.7109375, -7.703125, -6.6953125, -5.6875, -4.6796875, -3.671875, -2.6640625, -1.65625, -0.6484375, 0.359375, 1.3671875, 2.375, 3.3828125, 4.390625, 5.3984375, 6.40625, 7.4140625, 8.421875, 9.4296875, 10.4375, 11.4453125, 12.453125, 13.4609375, 14.46875, 15.4765625, 16.484375, 17.4921875, 18.5, 19.5078125, 20.515625, 21.5234375, 22.53125, 23.5390625, 24.546875, 25.5546875, 26.5625, 27.5703125, 28.578125, 29.5859375, 30.59375, 31.6015625, 32.609375, 33.6171875, 34.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 48.0, 152.0, 313.0, 313.0, 143.0, 34.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.572322845458984, -29.463878631591797, -27.355432510375977, -25.246986389160156, -23.13854217529297, -21.03009796142578, -18.92165184020996, -16.81320571899414, -14.704761505126953, -12.59631633758545, -10.487871170043945, -8.379426002502441, -6.2709808349609375, -4.162535667419434, -2.0540904998779297, 0.05435466766357422, 2.162799835205078, 4.271245002746582, 6.379690170288086, 8.48813533782959, 10.596580505371094, 12.705025672912598, 14.813470840454102, 16.921916961669922, 19.03036117553711, 21.138805389404297, 23.247251510620117, 25.355697631835938, 27.464141845703125, 29.572586059570312, 31.681032180786133, 33.78947830200195, 35.897926330566406, 38.006370544433594, 40.11481475830078, 42.223262786865234, 44.33170700073242, 46.44015121459961, 48.54859924316406, 50.65704345703125, 52.76548767089844, 54.873931884765625, 56.98237609863281, 59.090824127197266, 61.19926834106445, 63.30771255493164, 65.4161605834961, 67.52460479736328, 69.63304901123047, 71.74149322509766, 73.84993743896484, 75.95838165283203, 78.06683349609375, 80.17527770996094, 82.28372192382812, 84.39216613769531, 86.5006103515625, 88.60905456542969, 90.71749877929688, 92.82594299316406, 94.93438720703125, 97.04283905029297, 99.15128326416016, 101.25972747802734, 103.36817169189453]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 10.0, 4.0, 5.0, 8.0, 7.0, 11.0, 12.0, 15.0, 16.0, 25.0, 18.0, 24.0, 32.0, 28.0, 30.0, 31.0, 47.0, 39.0, 36.0, 49.0, 36.0, 40.0, 36.0, 33.0, 46.0, 40.0, 52.0, 39.0, 32.0, 28.0, 30.0, 18.0, 20.0, 19.0, 12.0, 16.0, 18.0, 9.0, 9.0, 6.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.979713439941406, -22.316659927368164, -21.653608322143555, -20.990554809570312, -20.327503204345703, -19.66444969177246, -19.00139808654785, -18.33834457397461, -17.67529296875, -17.012239456176758, -16.34918785095215, -15.686135292053223, -15.023082733154297, -14.360029220581055, -13.696976661682129, -13.033924102783203, -12.370870590209961, -11.707818031311035, -11.04476547241211, -10.381712913513184, -9.718660354614258, -9.055606842041016, -8.39255428314209, -7.729501724243164, -7.066449165344238, -6.4033966064453125, -5.740344047546387, -5.077291011810303, -4.414238452911377, -3.751185894012451, -3.0881330966949463, -2.4250802993774414, -1.7620258331298828, -1.0989731550216675, -0.43592047691345215, 0.22713220119476318, 0.8901848793029785, 1.5532374382019043, 2.216290235519409, 2.879343032836914, 3.54239559173584, 4.205448150634766, 4.868500709533691, 5.531553745269775, 6.194606304168701, 6.857658863067627, 7.520711898803711, 8.183764457702637, 8.846817016601562, 9.509869575500488, 10.172922134399414, 10.83597469329834, 11.499027252197266, 12.162080764770508, 12.825133323669434, 13.48818588256836, 14.151238441467285, 14.814291000366211, 15.477343559265137, 16.140396118164062, 16.803449630737305, 17.466501235961914, 18.129554748535156, 18.792606353759766, 19.455659866333008]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 20.0, 19.0, 20.0, 24.0, 14.0, 34.0, 24.0, 33.0, 26.0, 28.0, 32.0, 32.0, 29.0, 45.0, 54.0, 31.0, 44.0, 39.0, 37.0, 38.0, 39.0, 44.0, 42.0, 33.0, 21.0, 30.0, 24.0, 19.0, 21.0, 15.0, 9.0, 7.0, 11.0, 9.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.472930908203125, -3.36578369140625, -3.258636474609375, -3.1514892578125, -3.044342041015625, -2.93719482421875, -2.830047607421875, -2.722900390625, -2.615753173828125, -2.50860595703125, -2.401458740234375, -2.2943115234375, -2.187164306640625, -2.08001708984375, -1.972869873046875, -1.86572265625, -1.758575439453125, -1.65142822265625, -1.544281005859375, -1.4371337890625, -1.329986572265625, -1.22283935546875, -1.115692138671875, -1.008544921875, -0.901397705078125, -0.79425048828125, -0.687103271484375, -0.5799560546875, -0.472808837890625, -0.36566162109375, -0.258514404296875, -0.1513671875, -0.044219970703125, 0.06292724609375, 0.170074462890625, 0.2772216796875, 0.384368896484375, 0.49151611328125, 0.598663330078125, 0.705810546875, 0.812957763671875, 0.92010498046875, 1.027252197265625, 1.1343994140625, 1.241546630859375, 1.34869384765625, 1.455841064453125, 1.56298828125, 1.670135498046875, 1.77728271484375, 1.884429931640625, 1.9915771484375, 2.098724365234375, 2.20587158203125, 2.313018798828125, 2.420166015625, 2.527313232421875, 2.63446044921875, 2.741607666015625, 2.8487548828125, 2.955902099609375, 3.06304931640625, 3.170196533203125, 3.27734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 28.0, 25.0, 24.0, 38.0, 75.0, 111.0, 153.0, 232.0, 304.0, 465.0, 708.0, 994.0, 1375.0, 2013.0, 2846.0, 4301.0, 6010.0, 8886.0, 12490.0, 18304.0, 26968.0, 40852.0, 64013.0, 107949.0, 212449.0, 224806.0, 113778.0, 66679.0, 42513.0, 27692.0, 18796.0, 13148.0, 8884.0, 6214.0, 4451.0, 3141.0, 2034.0, 1442.0, 1045.0, 746.0, 438.0, 347.0, 257.0, 161.0, 121.0, 69.0, 57.0, 38.0, 26.0, 25.0, 6.0, 11.0, 3.0, 6.0, 2.0, 0.0, 3.0], "bins": [-0.52685546875, -0.5104141235351562, -0.4939727783203125, -0.47753143310546875, -0.461090087890625, -0.44464874267578125, -0.4282073974609375, -0.41176605224609375, -0.39532470703125, -0.37888336181640625, -0.3624420166015625, -0.34600067138671875, -0.329559326171875, -0.31311798095703125, -0.2966766357421875, -0.28023529052734375, -0.2637939453125, -0.24735260009765625, -0.2309112548828125, -0.21446990966796875, -0.198028564453125, -0.18158721923828125, -0.1651458740234375, -0.14870452880859375, -0.13226318359375, -0.11582183837890625, -0.0993804931640625, -0.08293914794921875, -0.066497802734375, -0.05005645751953125, -0.0336151123046875, -0.01717376708984375, -0.000732421875, 0.01570892333984375, 0.0321502685546875, 0.04859161376953125, 0.065032958984375, 0.08147430419921875, 0.0979156494140625, 0.11435699462890625, 0.13079833984375, 0.14723968505859375, 0.1636810302734375, 0.18012237548828125, 0.196563720703125, 0.21300506591796875, 0.2294464111328125, 0.24588775634765625, 0.2623291015625, 0.27877044677734375, 0.2952117919921875, 0.31165313720703125, 0.328094482421875, 0.34453582763671875, 0.3609771728515625, 0.37741851806640625, 0.39385986328125, 0.41030120849609375, 0.4267425537109375, 0.44318389892578125, 0.459625244140625, 0.47606658935546875, 0.4925079345703125, 0.5089492797851562, 0.525390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 8.0, 9.0, 9.0, 20.0, 14.0, 17.0, 21.0, 23.0, 27.0, 27.0, 21.0, 36.0, 30.0, 23.0, 38.0, 32.0, 41.0, 39.0, 42.0, 1057.0, 42.0, 51.0, 34.0, 35.0, 25.0, 35.0, 32.0, 24.0, 26.0, 28.0, 26.0, 15.0, 11.0, 15.0, 16.0, 7.0, 9.0, 9.0, 9.0, 2.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9033203125, -1.842681884765625, -1.78204345703125, -1.721405029296875, -1.6607666015625, -1.600128173828125, -1.53948974609375, -1.478851318359375, -1.418212890625, -1.357574462890625, -1.29693603515625, -1.236297607421875, -1.1756591796875, -1.115020751953125, -1.05438232421875, -0.993743896484375, -0.93310546875, -0.872467041015625, -0.81182861328125, -0.751190185546875, -0.6905517578125, -0.629913330078125, -0.56927490234375, -0.508636474609375, -0.447998046875, -0.387359619140625, -0.32672119140625, -0.266082763671875, -0.2054443359375, -0.144805908203125, -0.08416748046875, -0.023529052734375, 0.037109375, 0.097747802734375, 0.15838623046875, 0.219024658203125, 0.2796630859375, 0.340301513671875, 0.40093994140625, 0.461578369140625, 0.522216796875, 0.582855224609375, 0.64349365234375, 0.704132080078125, 0.7647705078125, 0.825408935546875, 0.88604736328125, 0.946685791015625, 1.00732421875, 1.067962646484375, 1.12860107421875, 1.189239501953125, 1.2498779296875, 1.310516357421875, 1.37115478515625, 1.431793212890625, 1.492431640625, 1.553070068359375, 1.61370849609375, 1.674346923828125, 1.7349853515625, 1.795623779296875, 1.85626220703125, 1.916900634765625, 1.9775390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 5.0, 10.0, 7.0, 18.0, 41.0, 48.0, 64.0, 89.0, 141.0, 190.0, 289.0, 392.0, 534.0, 825.0, 1153.0, 1567.0, 2190.0, 3289.0, 4575.0, 6722.0, 9891.0, 14788.0, 22682.0, 35484.0, 57403.0, 98210.0, 197229.0, 1315729.0, 125963.0, 70962.0, 43171.0, 27499.0, 17915.0, 11998.0, 8029.0, 5571.0, 3780.0, 2637.0, 1781.0, 1302.0, 888.0, 619.0, 456.0, 340.0, 204.0, 141.0, 96.0, 65.0, 59.0, 35.0, 21.0, 15.0, 10.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.50830078125, -0.49201202392578125, -0.4757232666015625, -0.45943450927734375, -0.443145751953125, -0.42685699462890625, -0.4105682373046875, -0.39427947998046875, -0.37799072265625, -0.36170196533203125, -0.3454132080078125, -0.32912445068359375, -0.312835693359375, -0.29654693603515625, -0.2802581787109375, -0.26396942138671875, -0.2476806640625, -0.23139190673828125, -0.2151031494140625, -0.19881439208984375, -0.182525634765625, -0.16623687744140625, -0.1499481201171875, -0.13365936279296875, -0.11737060546875, -0.10108184814453125, -0.0847930908203125, -0.06850433349609375, -0.052215576171875, -0.03592681884765625, -0.0196380615234375, -0.00334930419921875, 0.012939453125, 0.02922821044921875, 0.0455169677734375, 0.06180572509765625, 0.078094482421875, 0.09438323974609375, 0.1106719970703125, 0.12696075439453125, 0.14324951171875, 0.15953826904296875, 0.1758270263671875, 0.19211578369140625, 0.208404541015625, 0.22469329833984375, 0.2409820556640625, 0.25727081298828125, 0.2735595703125, 0.28984832763671875, 0.3061370849609375, 0.32242584228515625, 0.338714599609375, 0.35500335693359375, 0.3712921142578125, 0.38758087158203125, 0.40386962890625, 0.42015838623046875, 0.4364471435546875, 0.45273590087890625, 0.469024658203125, 0.48531341552734375, 0.5016021728515625, 0.5178909301757812, 0.5341796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 9.0, 13.0, 11.0, 18.0, 31.0, 34.0, 56.0, 64.0, 93.0, 73.0, 76.0, 99.0, 81.0, 70.0, 87.0, 43.0, 40.0, 26.0, 17.0, 17.0, 16.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000591278076171875, -0.0005702376365661621, -0.0005491971969604492, -0.0005281567573547363, -0.0005071163177490234, -0.00048607587814331055, -0.00046503543853759766, -0.00044399499893188477, -0.0004229545593261719, -0.000401914119720459, -0.0003808736801147461, -0.0003598332405090332, -0.0003387928009033203, -0.0003177523612976074, -0.00029671192169189453, -0.00027567148208618164, -0.00025463104248046875, -0.00023359060287475586, -0.00021255016326904297, -0.00019150972366333008, -0.0001704692840576172, -0.0001494288444519043, -0.0001283884048461914, -0.00010734796524047852, -8.630752563476562e-05, -6.526708602905273e-05, -4.4226646423339844e-05, -2.3186206817626953e-05, -2.1457672119140625e-06, 1.8894672393798828e-05, 3.993511199951172e-05, 6.097555160522461e-05, 8.20159912109375e-05, 0.00010305643081665039, 0.00012409687042236328, 0.00014513731002807617, 0.00016617774963378906, 0.00018721818923950195, 0.00020825862884521484, 0.00022929906845092773, 0.0002503395080566406, 0.0002713799476623535, 0.0002924203872680664, 0.0003134608268737793, 0.0003345012664794922, 0.0003555417060852051, 0.00037658214569091797, 0.00039762258529663086, 0.00041866302490234375, 0.00043970346450805664, 0.00046074390411376953, 0.0004817843437194824, 0.0005028247833251953, 0.0005238652229309082, 0.0005449056625366211, 0.000565946102142334, 0.0005869865417480469, 0.0006080269813537598, 0.0006290674209594727, 0.0006501078605651855, 0.0006711483001708984, 0.0006921887397766113, 0.0007132291793823242, 0.0007342696189880371, 0.00075531005859375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 14.0, 29.0, 41.0, 47.0, 49.0, 114.0, 142.0, 291.0, 830.0, 38302.0, 1006473.0, 1250.0, 376.0, 194.0, 120.0, 87.0, 58.0, 27.0, 23.0, 19.0, 13.0, 7.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0155487060546875, -0.015118718147277832, -0.014688730239868164, -0.014258742332458496, -0.013828754425048828, -0.01339876651763916, -0.012968778610229492, -0.012538790702819824, -0.012108802795410156, -0.011678814888000488, -0.01124882698059082, -0.010818839073181152, -0.010388851165771484, -0.009958863258361816, -0.009528875350952148, -0.00909888744354248, -0.008668899536132812, -0.008238911628723145, -0.0078089237213134766, -0.007378935813903809, -0.006948947906494141, -0.006518959999084473, -0.006088972091674805, -0.005658984184265137, -0.005228996276855469, -0.004799008369445801, -0.004369020462036133, -0.003939032554626465, -0.003509044647216797, -0.003079056739807129, -0.002649068832397461, -0.002219080924987793, -0.001789093017578125, -0.001359105110168457, -0.0009291172027587891, -0.0004991292953491211, -6.914138793945312e-05, 0.00036084651947021484, 0.0007908344268798828, 0.0012208223342895508, 0.0016508102416992188, 0.0020807981491088867, 0.0025107860565185547, 0.0029407739639282227, 0.0033707618713378906, 0.0038007497787475586, 0.0042307376861572266, 0.0046607255935668945, 0.0050907135009765625, 0.0055207014083862305, 0.0059506893157958984, 0.006380677223205566, 0.006810665130615234, 0.007240653038024902, 0.00767064094543457, 0.008100628852844238, 0.008530616760253906, 0.008960604667663574, 0.009390592575073242, 0.00982058048248291, 0.010250568389892578, 0.010680556297302246, 0.011110544204711914, 0.011540532112121582, 0.01197052001953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 41.0, 352.0, 510.0, 101.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0020160379353910685, -0.001980794593691826, -0.001945551368407905, -0.0019103080267086625, -0.00187506468500942, -0.0018398214597254992, -0.0018045781180262566, -0.001769334776327014, -0.0017340915510430932, -0.0016988482093438506, -0.0016636049840599298, -0.0016283616423606873, -0.0015931183006614447, -0.001557875075377524, -0.0015226317336782813, -0.0014873885083943605, -0.001452145166695118, -0.0014169018249958754, -0.0013816585997119546, -0.001346415258012712, -0.0013111719163134694, -0.0012759286910295486, -0.001240685349330306, -0.0012054420076310635, -0.0011701986659318209, -0.0011349553242325783, -0.0010997120989486575, -0.001064468757249415, -0.0010292254155501723, -0.0009939821902662516, -0.000958738848567009, -0.0009234955650754273, -0.0008882522815838456, -0.0008530089980922639, -0.0008177656563930213, -0.0007825223729014397, -0.000747279089409858, -0.0007120358059182763, -0.0006767924642190337, -0.000641549180727452, -0.0006063058972358704, -0.0005710626137442887, -0.0005358192720450461, -0.0005005759885534644, -0.00046533270506188273, -0.0004300893924664706, -0.00039484607987105846, -0.0003596027963794768, -0.0003243594546802342, -0.00028911614208482206, -0.0002538728585932404, -0.00021862954599782825, -0.00018338624795433134, -0.00014814294991083443, -0.0001128996373154223, -7.765635382384062e-05, -4.241304122842848e-05, -7.169739546952769e-06, 2.8073562134522945e-05, 6.331686745397747e-05, 9.856016549747437e-05, 0.00013380346354097128, 0.00016904677613638341, 0.0002042900596279651, 0.00023953337222337723]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 12.0, 12.0, 11.0, 17.0, 17.0, 21.0, 25.0, 37.0, 22.0, 23.0, 35.0, 37.0, 29.0, 30.0, 50.0, 38.0, 44.0, 63.0, 40.0, 32.0, 42.0, 31.0, 39.0, 22.0, 37.0, 30.0, 22.0, 35.0, 18.0, 16.0, 17.0, 12.0, 14.0, 8.0, 9.0, 5.0, 5.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00023794174194335938, -0.00023050233721733093, -0.0002230629324913025, -0.00021562352776527405, -0.0002081841230392456, -0.00020074471831321716, -0.00019330531358718872, -0.00018586590886116028, -0.00017842650413513184, -0.0001709870994091034, -0.00016354769468307495, -0.0001561082899570465, -0.00014866888523101807, -0.00014122948050498962, -0.00013379007577896118, -0.00012635067105293274, -0.0001189112663269043, -0.00011147186160087585, -0.00010403245687484741, -9.659305214881897e-05, -8.915364742279053e-05, -8.171424269676208e-05, -7.427483797073364e-05, -6.68354332447052e-05, -5.939602851867676e-05, -5.1956623792648315e-05, -4.451721906661987e-05, -3.707781434059143e-05, -2.9638409614562988e-05, -2.2199004888534546e-05, -1.4759600162506104e-05, -7.320195436477661e-06, 1.1920928955078125e-07, 7.558614015579224e-06, 1.4998018741607666e-05, 2.243742346763611e-05, 2.987682819366455e-05, 3.731623291969299e-05, 4.4755637645721436e-05, 5.219504237174988e-05, 5.963444709777832e-05, 6.707385182380676e-05, 7.45132565498352e-05, 8.195266127586365e-05, 8.939206600189209e-05, 9.683147072792053e-05, 0.00010427087545394897, 0.00011171028017997742, 0.00011914968490600586, 0.0001265890896320343, 0.00013402849435806274, 0.0001414678990840912, 0.00014890730381011963, 0.00015634670853614807, 0.00016378611326217651, 0.00017122551798820496, 0.0001786649227142334, 0.00018610432744026184, 0.00019354373216629028, 0.00020098313689231873, 0.00020842254161834717, 0.0002158619463443756, 0.00022330135107040405, 0.0002307407557964325, 0.00023818016052246094]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 20.0, 19.0, 20.0, 24.0, 14.0, 34.0, 24.0, 33.0, 26.0, 28.0, 32.0, 32.0, 29.0, 45.0, 54.0, 31.0, 44.0, 39.0, 37.0, 38.0, 39.0, 44.0, 42.0, 33.0, 21.0, 30.0, 24.0, 19.0, 21.0, 15.0, 9.0, 7.0, 11.0, 9.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.472930908203125, -3.36578369140625, -3.258636474609375, -3.1514892578125, -3.044342041015625, -2.93719482421875, -2.830047607421875, -2.722900390625, -2.615753173828125, -2.50860595703125, -2.401458740234375, -2.2943115234375, -2.187164306640625, -2.08001708984375, -1.972869873046875, -1.86572265625, -1.758575439453125, -1.65142822265625, -1.544281005859375, -1.4371337890625, -1.329986572265625, -1.22283935546875, -1.115692138671875, -1.008544921875, -0.901397705078125, -0.79425048828125, -0.687103271484375, -0.5799560546875, -0.472808837890625, -0.36566162109375, -0.258514404296875, -0.1513671875, -0.044219970703125, 0.06292724609375, 0.170074462890625, 0.2772216796875, 0.384368896484375, 0.49151611328125, 0.598663330078125, 0.705810546875, 0.812957763671875, 0.92010498046875, 1.027252197265625, 1.1343994140625, 1.241546630859375, 1.34869384765625, 1.455841064453125, 1.56298828125, 1.670135498046875, 1.77728271484375, 1.884429931640625, 1.9915771484375, 2.098724365234375, 2.20587158203125, 2.313018798828125, 2.420166015625, 2.527313232421875, 2.63446044921875, 2.741607666015625, 2.8487548828125, 2.955902099609375, 3.06304931640625, 3.170196533203125, 3.27734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 10.0, 11.0, 16.0, 24.0, 24.0, 27.0, 37.0, 53.0, 62.0, 98.0, 126.0, 169.0, 264.0, 567.0, 1548.0, 7210.0, 46621.0, 328456.0, 572347.0, 75160.0, 11730.0, 2138.0, 719.0, 369.0, 203.0, 141.0, 108.0, 63.0, 62.0, 44.0, 31.0, 20.0, 19.0, 15.0, 10.0, 15.0, 6.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.50018310546875, -7.2738037109375, -7.04742431640625, -6.821044921875, -6.59466552734375, -6.3682861328125, -6.14190673828125, -5.91552734375, -5.68914794921875, -5.4627685546875, -5.23638916015625, -5.010009765625, -4.78363037109375, -4.5572509765625, -4.33087158203125, -4.1044921875, -3.87811279296875, -3.6517333984375, -3.42535400390625, -3.198974609375, -2.97259521484375, -2.7462158203125, -2.51983642578125, -2.29345703125, -2.06707763671875, -1.8406982421875, -1.61431884765625, -1.387939453125, -1.16156005859375, -0.9351806640625, -0.70880126953125, -0.482421875, -0.25604248046875, -0.0296630859375, 0.19671630859375, 0.423095703125, 0.64947509765625, 0.8758544921875, 1.10223388671875, 1.32861328125, 1.55499267578125, 1.7813720703125, 2.00775146484375, 2.234130859375, 2.46051025390625, 2.6868896484375, 2.91326904296875, 3.1396484375, 3.36602783203125, 3.5924072265625, 3.81878662109375, 4.045166015625, 4.27154541015625, 4.4979248046875, 4.72430419921875, 4.95068359375, 5.17706298828125, 5.4034423828125, 5.62982177734375, 5.856201171875, 6.08258056640625, 6.3089599609375, 6.53533935546875, 6.76171875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 5.0, 12.0, 9.0, 16.0, 10.0, 15.0, 23.0, 22.0, 34.0, 30.0, 27.0, 38.0, 40.0, 43.0, 59.0, 71.0, 129.0, 352.0, 1465.0, 147.0, 78.0, 56.0, 45.0, 27.0, 30.0, 28.0, 33.0, 20.0, 19.0, 17.0, 18.0, 11.0, 15.0, 14.0, 13.0, 9.0, 7.0, 9.0, 6.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.7890625, -10.452880859375, -10.11669921875, -9.780517578125, -9.4443359375, -9.108154296875, -8.77197265625, -8.435791015625, -8.099609375, -7.763427734375, -7.42724609375, -7.091064453125, -6.7548828125, -6.418701171875, -6.08251953125, -5.746337890625, -5.41015625, -5.073974609375, -4.73779296875, -4.401611328125, -4.0654296875, -3.729248046875, -3.39306640625, -3.056884765625, -2.720703125, -2.384521484375, -2.04833984375, -1.712158203125, -1.3759765625, -1.039794921875, -0.70361328125, -0.367431640625, -0.03125, 0.304931640625, 0.64111328125, 0.977294921875, 1.3134765625, 1.649658203125, 1.98583984375, 2.322021484375, 2.658203125, 2.994384765625, 3.33056640625, 3.666748046875, 4.0029296875, 4.339111328125, 4.67529296875, 5.011474609375, 5.34765625, 5.683837890625, 6.02001953125, 6.356201171875, 6.6923828125, 7.028564453125, 7.36474609375, 7.700927734375, 8.037109375, 8.373291015625, 8.70947265625, 9.045654296875, 9.3818359375, 9.718017578125, 10.05419921875, 10.390380859375, 10.7265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 2.0, 9.0, 8.0, 8.0, 11.0, 16.0, 16.0, 24.0, 15.0, 40.0, 30.0, 43.0, 45.0, 55.0, 67.0, 81.0, 124.0, 208.0, 463.0, 1203.0, 21611.0, 3108733.0, 10698.0, 973.0, 406.0, 215.0, 136.0, 112.0, 82.0, 53.0, 46.0, 28.0, 32.0, 24.0, 30.0, 10.0, 12.0, 8.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.61279296875, -33.4755859375, -32.33837890625, -31.201171875, -30.06396484375, -28.9267578125, -27.78955078125, -26.65234375, -25.51513671875, -24.3779296875, -23.24072265625, -22.103515625, -20.96630859375, -19.8291015625, -18.69189453125, -17.5546875, -16.41748046875, -15.2802734375, -14.14306640625, -13.005859375, -11.86865234375, -10.7314453125, -9.59423828125, -8.45703125, -7.31982421875, -6.1826171875, -5.04541015625, -3.908203125, -2.77099609375, -1.6337890625, -0.49658203125, 0.640625, 1.77783203125, 2.9150390625, 4.05224609375, 5.189453125, 6.32666015625, 7.4638671875, 8.60107421875, 9.73828125, 10.87548828125, 12.0126953125, 13.14990234375, 14.287109375, 15.42431640625, 16.5615234375, 17.69873046875, 18.8359375, 19.97314453125, 21.1103515625, 22.24755859375, 23.384765625, 24.52197265625, 25.6591796875, 26.79638671875, 27.93359375, 29.07080078125, 30.2080078125, 31.34521484375, 32.482421875, 33.61962890625, 34.7568359375, 35.89404296875, 37.03125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 22.0, 89.0, 284.0, 360.0, 210.0, 43.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.74382781982422, -51.605743408203125, -50.46765899658203, -49.32957077026367, -48.19148635864258, -47.053401947021484, -45.91531753540039, -44.77722930908203, -43.63914489746094, -42.501060485839844, -41.36297607421875, -40.22488784790039, -39.0868034362793, -37.9487190246582, -36.81063461303711, -35.67254638671875, -34.534461975097656, -33.39637756347656, -32.25829315185547, -31.120206832885742, -29.982120513916016, -28.844036102294922, -27.705951690673828, -26.5678653717041, -25.42978286743164, -24.291698455810547, -23.15361213684082, -22.015527725219727, -20.87744140625, -19.739356994628906, -18.601272583007812, -17.463186264038086, -16.32509994506836, -15.18701457977295, -14.048929214477539, -12.910844802856445, -11.772758483886719, -10.634674072265625, -9.496588706970215, -8.358503341674805, -7.2204179763793945, -6.082332611083984, -4.944247245788574, -3.8061623573303223, -2.668076992034912, -1.529991626739502, -0.39190673828125, 0.7461786270141602, 1.8842639923095703, 3.0223493576049805, 4.160434722900391, 5.298519611358643, 6.436604976654053, 7.574690341949463, 8.712775230407715, 9.850860595703125, 10.988945960998535, 12.127031326293945, 13.265116691589355, 14.403202056884766, 15.54128646850586, 16.679372787475586, 17.81745719909668, 18.955543518066406, 20.0936279296875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 12.0, 11.0, 16.0, 14.0, 13.0, 36.0, 23.0, 28.0, 37.0, 38.0, 46.0, 41.0, 47.0, 51.0, 50.0, 57.0, 57.0, 48.0, 61.0, 44.0, 42.0, 39.0, 26.0, 33.0, 22.0, 23.0, 13.0, 12.0, 18.0, 7.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.57958221435547, -50.222007751464844, -48.86442947387695, -47.50685501098633, -46.14927673339844, -44.79170227050781, -43.43412780761719, -42.0765495300293, -40.71897506713867, -39.36140060424805, -38.003822326660156, -36.64624786376953, -35.28866958618164, -33.931095123291016, -32.573516845703125, -31.2159423828125, -29.858366012573242, -28.500789642333984, -27.143213272094727, -25.78563690185547, -24.428062438964844, -23.070486068725586, -21.712909698486328, -20.355335235595703, -18.997756958007812, -17.640180587768555, -16.282604217529297, -14.925028800964355, -13.567453384399414, -12.209877014160156, -10.852300643920898, -9.494725227355957, -8.137149810791016, -6.779573917388916, -5.421998023986816, -4.064421653747559, -2.706845760345459, -1.3492698669433594, 0.008306503295898438, 1.3658819198608398, 2.7234582901000977, 4.081034183502197, 5.438610076904297, 6.796186447143555, 8.153762817382812, 9.511338233947754, 10.868914604187012, 12.226490020751953, 13.584066390991211, 14.941642761230469, 16.299219131469727, 17.656795501708984, 19.01436996459961, 20.371946334838867, 21.729522705078125, 23.08709716796875, 24.44467544555664, 25.8022518157959, 27.159828186035156, 28.51740264892578, 29.87497901916504, 31.232555389404297, 32.59013366699219, 33.94770812988281, 35.30528259277344]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 4.0, 9.0, 8.0, 14.0, 13.0, 25.0, 24.0, 27.0, 22.0, 27.0, 31.0, 30.0, 29.0, 35.0, 35.0, 41.0, 40.0, 39.0, 41.0, 54.0, 47.0, 23.0, 47.0, 44.0, 34.0, 43.0, 29.0, 28.0, 20.0, 31.0, 14.0, 22.0, 17.0, 1.0, 10.0, 4.0, 11.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.121795654296875, -3.99359130859375, -3.865386962890625, -3.7371826171875, -3.608978271484375, -3.48077392578125, -3.352569580078125, -3.224365234375, -3.096160888671875, -2.96795654296875, -2.839752197265625, -2.7115478515625, -2.583343505859375, -2.45513916015625, -2.326934814453125, -2.19873046875, -2.070526123046875, -1.94232177734375, -1.814117431640625, -1.6859130859375, -1.557708740234375, -1.42950439453125, -1.301300048828125, -1.173095703125, -1.044891357421875, -0.91668701171875, -0.788482666015625, -0.6602783203125, -0.532073974609375, -0.40386962890625, -0.275665283203125, -0.1474609375, -0.019256591796875, 0.10894775390625, 0.237152099609375, 0.3653564453125, 0.493560791015625, 0.62176513671875, 0.749969482421875, 0.878173828125, 1.006378173828125, 1.13458251953125, 1.262786865234375, 1.3909912109375, 1.519195556640625, 1.64739990234375, 1.775604248046875, 1.90380859375, 2.032012939453125, 2.16021728515625, 2.288421630859375, 2.4166259765625, 2.544830322265625, 2.67303466796875, 2.801239013671875, 2.929443359375, 3.057647705078125, 3.18585205078125, 3.314056396484375, 3.4422607421875, 3.570465087890625, 3.69866943359375, 3.826873779296875, 3.955078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 12.0, 6.0, 13.0, 17.0, 23.0, 20.0, 39.0, 32.0, 47.0, 65.0, 90.0, 152.0, 237.0, 397.0, 793.0, 2226.0, 10856.0, 79154.0, 524677.0, 1629817.0, 1448927.0, 421252.0, 63009.0, 8751.0, 1964.0, 712.0, 321.0, 213.0, 126.0, 70.0, 68.0, 41.0, 34.0, 24.0, 25.0, 20.0, 14.0, 7.0, 4.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.43524169921875, -5.2650146484375, -5.09478759765625, -4.924560546875, -4.75433349609375, -4.5841064453125, -4.41387939453125, -4.24365234375, -4.07342529296875, -3.9031982421875, -3.73297119140625, -3.562744140625, -3.39251708984375, -3.2222900390625, -3.05206298828125, -2.8818359375, -2.71160888671875, -2.5413818359375, -2.37115478515625, -2.200927734375, -2.03070068359375, -1.8604736328125, -1.69024658203125, -1.52001953125, -1.34979248046875, -1.1795654296875, -1.00933837890625, -0.839111328125, -0.66888427734375, -0.4986572265625, -0.32843017578125, -0.158203125, 0.01202392578125, 0.1822509765625, 0.35247802734375, 0.522705078125, 0.69293212890625, 0.8631591796875, 1.03338623046875, 1.20361328125, 1.37384033203125, 1.5440673828125, 1.71429443359375, 1.884521484375, 2.05474853515625, 2.2249755859375, 2.39520263671875, 2.5654296875, 2.73565673828125, 2.9058837890625, 3.07611083984375, 3.246337890625, 3.41656494140625, 3.5867919921875, 3.75701904296875, 3.92724609375, 4.09747314453125, 4.2677001953125, 4.43792724609375, 4.608154296875, 4.77838134765625, 4.9486083984375, 5.11883544921875, 5.2890625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 6.0, 11.0, 13.0, 17.0, 16.0, 31.0, 50.0, 48.0, 67.0, 97.0, 134.0, 169.0, 247.0, 305.0, 388.0, 456.0, 423.0, 395.0, 299.0, 235.0, 188.0, 132.0, 81.0, 70.0, 50.0, 33.0, 23.0, 19.0, 15.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.49609375, -7.2811279296875, -7.066162109375, -6.8511962890625, -6.63623046875, -6.4212646484375, -6.206298828125, -5.9913330078125, -5.7763671875, -5.5614013671875, -5.346435546875, -5.1314697265625, -4.91650390625, -4.7015380859375, -4.486572265625, -4.2716064453125, -4.056640625, -3.8416748046875, -3.626708984375, -3.4117431640625, -3.19677734375, -2.9818115234375, -2.766845703125, -2.5518798828125, -2.3369140625, -2.1219482421875, -1.906982421875, -1.6920166015625, -1.47705078125, -1.2620849609375, -1.047119140625, -0.8321533203125, -0.6171875, -0.4022216796875, -0.187255859375, 0.0277099609375, 0.24267578125, 0.4576416015625, 0.672607421875, 0.8875732421875, 1.1025390625, 1.3175048828125, 1.532470703125, 1.7474365234375, 1.96240234375, 2.1773681640625, 2.392333984375, 2.6072998046875, 2.822265625, 3.0372314453125, 3.252197265625, 3.4671630859375, 3.68212890625, 3.8970947265625, 4.112060546875, 4.3270263671875, 4.5419921875, 4.7569580078125, 4.971923828125, 5.1868896484375, 5.40185546875, 5.6168212890625, 5.831787109375, 6.0467529296875, 6.26171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 11.0, 19.0, 17.0, 26.0, 26.0, 52.0, 68.0, 118.0, 165.0, 261.0, 446.0, 747.0, 1618.0, 10611.0, 3220024.0, 952049.0, 5007.0, 1323.0, 589.0, 358.0, 238.0, 148.0, 107.0, 62.0, 52.0, 42.0, 23.0, 12.0, 9.0, 14.0, 6.0, 7.0, 3.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.715087890625, -19.91455078125, -19.114013671875, -18.3134765625, -17.512939453125, -16.71240234375, -15.911865234375, -15.111328125, -14.310791015625, -13.51025390625, -12.709716796875, -11.9091796875, -11.108642578125, -10.30810546875, -9.507568359375, -8.70703125, -7.906494140625, -7.10595703125, -6.305419921875, -5.5048828125, -4.704345703125, -3.90380859375, -3.103271484375, -2.302734375, -1.502197265625, -0.70166015625, 0.098876953125, 0.8994140625, 1.699951171875, 2.50048828125, 3.301025390625, 4.1015625, 4.902099609375, 5.70263671875, 6.503173828125, 7.3037109375, 8.104248046875, 8.90478515625, 9.705322265625, 10.505859375, 11.306396484375, 12.10693359375, 12.907470703125, 13.7080078125, 14.508544921875, 15.30908203125, 16.109619140625, 16.91015625, 17.710693359375, 18.51123046875, 19.311767578125, 20.1123046875, 20.912841796875, 21.71337890625, 22.513916015625, 23.314453125, 24.114990234375, 24.91552734375, 25.716064453125, 26.5166015625, 27.317138671875, 28.11767578125, 28.918212890625, 29.71875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 42.0, 386.0, 498.0, 86.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.50393676757812, -132.3837890625, -128.26364135742188, -124.14350891113281, -120.02336120605469, -115.90321350097656, -111.78307342529297, -107.66293334960938, -103.54278564453125, -99.42263793945312, -95.30249786376953, -91.18235778808594, -87.06221008300781, -82.94206237792969, -78.8219223022461, -74.7017822265625, -70.58163452148438, -66.46148681640625, -62.341346740722656, -58.2212028503418, -54.10105895996094, -49.98091506958008, -45.86077117919922, -41.74062728881836, -37.6204833984375, -33.50033950805664, -29.38019561767578, -25.260051727294922, -21.139907836914062, -17.019763946533203, -12.899620056152344, -8.779476165771484, -4.6593170166015625, -0.5391731262207031, 3.5809707641601562, 7.701114654541016, 11.821258544921875, 15.941402435302734, 20.061546325683594, 24.181690216064453, 28.301834106445312, 32.42197799682617, 36.54212188720703, 40.66226577758789, 44.78240966796875, 48.90255355834961, 53.02269744873047, 57.14284133911133, 61.26298522949219, 65.38313293457031, 69.5032730102539, 73.6234130859375, 77.74356079101562, 81.86370849609375, 85.98384857177734, 90.10398864746094, 94.22413635253906, 98.34428405761719, 102.46442413330078, 106.58456420898438, 110.7047119140625, 114.82485961914062, 118.94499969482422, 123.06513977050781, 127.18528747558594]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 3.0, 6.0, 10.0, 19.0, 14.0, 12.0, 19.0, 30.0, 33.0, 39.0, 36.0, 44.0, 32.0, 52.0, 48.0, 47.0, 43.0, 40.0, 48.0, 47.0, 39.0, 48.0, 39.0, 35.0, 28.0, 31.0, 30.0, 15.0, 16.0, 15.0, 15.0, 10.0, 3.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.92617416381836, -22.146080017089844, -21.365985870361328, -20.585891723632812, -19.805795669555664, -19.02570152282715, -18.245607376098633, -17.465513229370117, -16.68541717529297, -15.905323028564453, -15.125227928161621, -14.345133781433105, -13.565038681030273, -12.784944534301758, -12.004850387573242, -11.224756240844727, -10.444662094116211, -9.664567947387695, -8.884472846984863, -8.104378700256348, -7.324284076690674, -6.544189453125, -5.764095306396484, -4.9840006828308105, -4.203906059265137, -3.423811435699463, -2.643717050552368, -1.8636226654052734, -1.0835280418395996, -0.3034334182739258, 0.47666072845458984, 1.2567553520202637, 2.0368499755859375, 2.8169445991516113, 3.597038984298706, 4.377133369445801, 5.157227993011475, 5.937322616577148, 6.717416763305664, 7.497511386871338, 8.277606010437012, 9.057700157165527, 9.83779525756836, 10.617889404296875, 11.39798355102539, 12.178078651428223, 12.958172798156738, 13.73826789855957, 14.518362045288086, 15.298456192016602, 16.078550338745117, 16.858646392822266, 17.63874053955078, 18.418834686279297, 19.198928833007812, 19.979022979736328, 20.759117126464844, 21.53921127319336, 22.319305419921875, 23.09939956665039, 23.87949562072754, 24.659589767456055, 25.43968391418457, 26.219778060913086, 26.999874114990234]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 10.0, 5.0, 9.0, 7.0, 10.0, 3.0, 20.0, 14.0, 20.0, 20.0, 26.0, 29.0, 21.0, 24.0, 35.0, 35.0, 31.0, 43.0, 35.0, 38.0, 39.0, 36.0, 36.0, 49.0, 48.0, 37.0, 35.0, 30.0, 31.0, 26.0, 28.0, 22.0, 22.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.515625, -3.40960693359375, -3.3035888671875, -3.19757080078125, -3.091552734375, -2.98553466796875, -2.8795166015625, -2.77349853515625, -2.66748046875, -2.56146240234375, -2.4554443359375, -2.34942626953125, -2.243408203125, -2.13739013671875, -2.0313720703125, -1.92535400390625, -1.8193359375, -1.71331787109375, -1.6072998046875, -1.50128173828125, -1.395263671875, -1.28924560546875, -1.1832275390625, -1.07720947265625, -0.97119140625, -0.86517333984375, -0.7591552734375, -0.65313720703125, -0.547119140625, -0.44110107421875, -0.3350830078125, -0.22906494140625, -0.123046875, -0.01702880859375, 0.0889892578125, 0.19500732421875, 0.301025390625, 0.40704345703125, 0.5130615234375, 0.61907958984375, 0.72509765625, 0.83111572265625, 0.9371337890625, 1.04315185546875, 1.149169921875, 1.25518798828125, 1.3612060546875, 1.46722412109375, 1.5732421875, 1.67926025390625, 1.7852783203125, 1.89129638671875, 1.997314453125, 2.10333251953125, 2.2093505859375, 2.31536865234375, 2.42138671875, 2.52740478515625, 2.6334228515625, 2.73944091796875, 2.845458984375, 2.95147705078125, 3.0574951171875, 3.16351318359375, 3.26953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 3.0, 13.0, 28.0, 20.0, 42.0, 77.0, 123.0, 194.0, 270.0, 392.0, 628.0, 906.0, 1378.0, 2096.0, 3099.0, 5029.0, 8022.0, 12552.0, 20345.0, 33143.0, 57492.0, 106304.0, 230511.0, 275157.0, 125745.0, 66042.0, 37280.0, 22821.0, 14039.0, 8925.0, 5550.0, 3755.0, 2258.0, 1498.0, 928.0, 655.0, 430.0, 261.0, 201.0, 120.0, 85.0, 39.0, 32.0, 33.0, 16.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67041015625, -0.6495361328125, -0.628662109375, -0.6077880859375, -0.5869140625, -0.5660400390625, -0.545166015625, -0.5242919921875, -0.50341796875, -0.4825439453125, -0.461669921875, -0.4407958984375, -0.419921875, -0.3990478515625, -0.378173828125, -0.3572998046875, -0.33642578125, -0.3155517578125, -0.294677734375, -0.2738037109375, -0.2529296875, -0.2320556640625, -0.211181640625, -0.1903076171875, -0.16943359375, -0.1485595703125, -0.127685546875, -0.1068115234375, -0.0859375, -0.0650634765625, -0.044189453125, -0.0233154296875, -0.00244140625, 0.0184326171875, 0.039306640625, 0.0601806640625, 0.0810546875, 0.1019287109375, 0.122802734375, 0.1436767578125, 0.16455078125, 0.1854248046875, 0.206298828125, 0.2271728515625, 0.248046875, 0.2689208984375, 0.289794921875, 0.3106689453125, 0.33154296875, 0.3524169921875, 0.373291015625, 0.3941650390625, 0.4150390625, 0.4359130859375, 0.456787109375, 0.4776611328125, 0.49853515625, 0.5194091796875, 0.540283203125, 0.5611572265625, 0.58203125, 0.6029052734375, 0.623779296875, 0.6446533203125, 0.66552734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 12.0, 9.0, 12.0, 13.0, 11.0, 26.0, 25.0, 42.0, 29.0, 31.0, 44.0, 38.0, 32.0, 56.0, 57.0, 49.0, 1073.0, 58.0, 40.0, 39.0, 48.0, 31.0, 37.0, 31.0, 27.0, 28.0, 22.0, 18.0, 21.0, 10.0, 11.0, 10.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.72064208984375, -2.6365966796875, -2.55255126953125, -2.468505859375, -2.38446044921875, -2.3004150390625, -2.21636962890625, -2.13232421875, -2.04827880859375, -1.9642333984375, -1.88018798828125, -1.796142578125, -1.71209716796875, -1.6280517578125, -1.54400634765625, -1.4599609375, -1.37591552734375, -1.2918701171875, -1.20782470703125, -1.123779296875, -1.03973388671875, -0.9556884765625, -0.87164306640625, -0.78759765625, -0.70355224609375, -0.6195068359375, -0.53546142578125, -0.451416015625, -0.36737060546875, -0.2833251953125, -0.19927978515625, -0.115234375, -0.03118896484375, 0.0528564453125, 0.13690185546875, 0.220947265625, 0.30499267578125, 0.3890380859375, 0.47308349609375, 0.55712890625, 0.64117431640625, 0.7252197265625, 0.80926513671875, 0.893310546875, 0.97735595703125, 1.0614013671875, 1.14544677734375, 1.2294921875, 1.31353759765625, 1.3975830078125, 1.48162841796875, 1.565673828125, 1.64971923828125, 1.7337646484375, 1.81781005859375, 1.90185546875, 1.98590087890625, 2.0699462890625, 2.15399169921875, 2.238037109375, 2.32208251953125, 2.4061279296875, 2.49017333984375, 2.57421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 11.0, 18.0, 22.0, 21.0, 38.0, 55.0, 95.0, 121.0, 213.0, 304.0, 470.0, 703.0, 1067.0, 1617.0, 2584.0, 4043.0, 6446.0, 10297.0, 16710.0, 28174.0, 49398.0, 92615.0, 206317.0, 1373086.0, 137841.0, 68475.0, 38144.0, 22234.0, 13306.0, 8332.0, 5037.0, 3262.0, 2113.0, 1328.0, 939.0, 550.0, 375.0, 248.0, 180.0, 104.0, 87.0, 51.0, 41.0, 18.0, 12.0, 10.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74951171875, -0.7269821166992188, -0.7044525146484375, -0.6819229125976562, -0.659393310546875, -0.6368637084960938, -0.6143341064453125, -0.5918045043945312, -0.56927490234375, -0.5467453002929688, -0.5242156982421875, -0.5016860961914062, -0.479156494140625, -0.45662689208984375, -0.4340972900390625, -0.41156768798828125, -0.3890380859375, -0.36650848388671875, -0.3439788818359375, -0.32144927978515625, -0.298919677734375, -0.27639007568359375, -0.2538604736328125, -0.23133087158203125, -0.20880126953125, -0.18627166748046875, -0.1637420654296875, -0.14121246337890625, -0.118682861328125, -0.09615325927734375, -0.0736236572265625, -0.05109405517578125, -0.028564453125, -0.00603485107421875, 0.0164947509765625, 0.03902435302734375, 0.061553955078125, 0.08408355712890625, 0.1066131591796875, 0.12914276123046875, 0.15167236328125, 0.17420196533203125, 0.1967315673828125, 0.21926116943359375, 0.241790771484375, 0.26432037353515625, 0.2868499755859375, 0.30937957763671875, 0.3319091796875, 0.35443878173828125, 0.3769683837890625, 0.39949798583984375, 0.422027587890625, 0.44455718994140625, 0.4670867919921875, 0.48961639404296875, 0.51214599609375, 0.5346755981445312, 0.5572052001953125, 0.5797348022460938, 0.602264404296875, 0.6247940063476562, 0.6473236083984375, 0.6698532104492188, 0.6923828125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 0.0, 8.0, 9.0, 16.0, 15.0, 22.0, 18.0, 16.0, 24.0, 34.0, 26.0, 44.0, 46.0, 38.0, 59.0, 78.0, 50.0, 59.0, 68.0, 60.0, 46.0, 47.0, 40.0, 28.0, 24.0, 27.0, 16.0, 11.0, 17.0, 3.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0004138946533203125, -0.0004028528928756714, -0.0003918111324310303, -0.00038076937198638916, -0.00036972761154174805, -0.00035868585109710693, -0.0003476440906524658, -0.0003366023302078247, -0.0003255605697631836, -0.0003145188093185425, -0.00030347704887390137, -0.00029243528842926025, -0.00028139352798461914, -0.00027035176753997803, -0.0002593100070953369, -0.0002482682466506958, -0.0002372264862060547, -0.00022618472576141357, -0.00021514296531677246, -0.00020410120487213135, -0.00019305944442749023, -0.00018201768398284912, -0.000170975923538208, -0.0001599341630935669, -0.00014889240264892578, -0.00013785064220428467, -0.00012680888175964355, -0.00011576712131500244, -0.00010472536087036133, -9.368360042572021e-05, -8.26418399810791e-05, -7.160007953643799e-05, -6.0558319091796875e-05, -4.951655864715576e-05, -3.847479820251465e-05, -2.7433037757873535e-05, -1.6391277313232422e-05, -5.349516868591309e-06, 5.692243576049805e-06, 1.6734004020690918e-05, 2.777576446533203e-05, 3.8817524909973145e-05, 4.985928535461426e-05, 6.090104579925537e-05, 7.194280624389648e-05, 8.29845666885376e-05, 9.402632713317871e-05, 0.00010506808757781982, 0.00011610984802246094, 0.00012715160846710205, 0.00013819336891174316, 0.00014923512935638428, 0.0001602768898010254, 0.0001713186502456665, 0.00018236041069030762, 0.00019340217113494873, 0.00020444393157958984, 0.00021548569202423096, 0.00022652745246887207, 0.00023756921291351318, 0.0002486109733581543, 0.0002596527338027954, 0.0002706944942474365, 0.00028173625469207764, 0.00029277801513671875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 8.0, 6.0, 5.0, 11.0, 9.0, 6.0, 9.0, 11.0, 17.0, 42.0, 29.0, 24.0, 45.0, 73.0, 106.0, 161.0, 221.0, 429.0, 1074.0, 89148.0, 953838.0, 1781.0, 619.0, 240.0, 165.0, 104.0, 67.0, 66.0, 49.0, 42.0, 31.0, 20.0, 24.0, 22.0, 13.0, 5.0, 6.0, 7.0, 4.0, 4.0, 6.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006134033203125, -0.005899786949157715, -0.00566554069519043, -0.0054312944412231445, -0.005197048187255859, -0.004962801933288574, -0.004728555679321289, -0.004494309425354004, -0.004260063171386719, -0.004025816917419434, -0.0037915706634521484, -0.0035573244094848633, -0.003323078155517578, -0.003088831901550293, -0.002854585647583008, -0.0026203393936157227, -0.0023860931396484375, -0.0021518468856811523, -0.0019176006317138672, -0.001683354377746582, -0.0014491081237792969, -0.0012148618698120117, -0.0009806156158447266, -0.0007463693618774414, -0.0005121231079101562, -0.0002778768539428711, -4.363059997558594e-05, 0.00019061565399169922, 0.0004248619079589844, 0.0006591081619262695, 0.0008933544158935547, 0.0011276006698608398, 0.001361846923828125, 0.0015960931777954102, 0.0018303394317626953, 0.0020645856857299805, 0.0022988319396972656, 0.0025330781936645508, 0.002767324447631836, 0.003001570701599121, 0.0032358169555664062, 0.0034700632095336914, 0.0037043094635009766, 0.003938555717468262, 0.004172801971435547, 0.004407048225402832, 0.004641294479370117, 0.004875540733337402, 0.0051097869873046875, 0.005344033241271973, 0.005578279495239258, 0.005812525749206543, 0.006046772003173828, 0.006281018257141113, 0.0065152645111083984, 0.006749510765075684, 0.006983757019042969, 0.007218003273010254, 0.007452249526977539, 0.007686495780944824, 0.00792074203491211, 0.008154988288879395, 0.00838923454284668, 0.008623480796813965, 0.00885772705078125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 17.0, 29.0, 46.0, 102.0, 148.0, 166.0, 171.0, 132.0, 95.0, 57.0, 20.0, 8.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002174089604523033, -0.00020824294188059866, -0.00019907692330889404, -0.0001899109047371894, -0.00018074488616548479, -0.00017157886759378016, -0.00016241284902207553, -0.0001532468304503709, -0.00014408081187866628, -0.00013491479330696166, -0.00012574877473525703, -0.0001165827561635524, -0.00010741673759184778, -9.825071902014315e-05, -8.908470044843853e-05, -7.99186818767339e-05, -7.075266330502927e-05, -6.158664473332465e-05, -5.242062616162002e-05, -4.3254607589915395e-05, -3.408858901821077e-05, -2.4922570446506143e-05, -1.5756551874801517e-05, -6.5905333030968904e-06, 2.5754852686077356e-06, 1.1741503840312362e-05, 2.0907522412016988e-05, 3.0073540983721614e-05, 3.923955955542624e-05, 4.8405578127130866e-05, 5.757159669883549e-05, 6.673761527054012e-05, 7.590363384224474e-05, 8.506965241394937e-05, 9.4235670985654e-05, 0.00010340168955735862, 0.00011256770812906325, 0.00012173372670076787, 0.0001308997452724725, 0.00014006576384417713, 0.00014923178241588175, 0.00015839780098758638, 0.000167563819559291, 0.00017672983813099563, 0.00018589585670270026, 0.00019506187527440488, 0.0002042278938461095, 0.00021339391241781414, 0.00022255993098951876, 0.0002317259495612234, 0.00024089196813292801, 0.00025005798670463264, 0.00025922400527633727, 0.0002683900238480419, 0.0002775560424197465, 0.00028672206099145114, 0.00029588807956315577, 0.0003050540981348604, 0.000314220116706565, 0.00032338613527826965, 0.0003325521538499743, 0.0003417181724216789, 0.0003508841909933835, 0.00036005020956508815, 0.0003692162281367928]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 7.0, 12.0, 6.0, 13.0, 11.0, 14.0, 16.0, 15.0, 25.0, 27.0, 35.0, 33.0, 26.0, 47.0, 34.0, 35.0, 45.0, 46.0, 34.0, 40.0, 51.0, 22.0, 39.0, 29.0, 39.0, 37.0, 38.0, 30.0, 26.0, 31.0, 12.0, 18.0, 19.0, 12.0, 8.0, 17.0, 6.0, 3.0, 3.0, 1.0, 5.0, 7.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0001887679100036621, -0.00018302258104085922, -0.00017727725207805634, -0.00017153192311525345, -0.00016578659415245056, -0.00016004126518964767, -0.0001542959362268448, -0.0001485506072640419, -0.00014280527830123901, -0.00013705994933843613, -0.00013131462037563324, -0.00012556929141283035, -0.00011982396245002747, -0.00011407863348722458, -0.00010833330452442169, -0.0001025879755616188, -9.684264659881592e-05, -9.109731763601303e-05, -8.535198867321014e-05, -7.960665971040726e-05, -7.386133074760437e-05, -6.811600178480148e-05, -6.23706728219986e-05, -5.662534385919571e-05, -5.088001489639282e-05, -4.5134685933589935e-05, -3.938935697078705e-05, -3.364402800798416e-05, -2.7898699045181274e-05, -2.2153370082378387e-05, -1.64080411195755e-05, -1.0662712156772614e-05, -4.9173831939697266e-06, 8.279457688331604e-07, 6.573274731636047e-06, 1.2318603694438934e-05, 1.806393265724182e-05, 2.3809261620044708e-05, 2.9554590582847595e-05, 3.529991954565048e-05, 4.104524850845337e-05, 4.6790577471256256e-05, 5.253590643405914e-05, 5.828123539686203e-05, 6.402656435966492e-05, 6.97718933224678e-05, 7.551722228527069e-05, 8.126255124807358e-05, 8.700788021087646e-05, 9.275320917367935e-05, 9.849853813648224e-05, 0.00010424386709928513, 0.00010998919606208801, 0.0001157345250248909, 0.00012147985398769379, 0.00012722518295049667, 0.00013297051191329956, 0.00013871584087610245, 0.00014446116983890533, 0.00015020649880170822, 0.0001559518277645111, 0.000161697156727314, 0.00016744248569011688, 0.00017318781465291977, 0.00017893314361572266]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 10.0, 5.0, 9.0, 7.0, 10.0, 3.0, 20.0, 14.0, 20.0, 20.0, 26.0, 29.0, 21.0, 24.0, 35.0, 35.0, 31.0, 43.0, 35.0, 38.0, 39.0, 36.0, 36.0, 49.0, 48.0, 37.0, 35.0, 30.0, 31.0, 26.0, 28.0, 22.0, 22.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.515625, -3.40960693359375, -3.3035888671875, -3.19757080078125, -3.091552734375, -2.98553466796875, -2.8795166015625, -2.77349853515625, -2.66748046875, -2.56146240234375, -2.4554443359375, -2.34942626953125, -2.243408203125, -2.13739013671875, -2.0313720703125, -1.92535400390625, -1.8193359375, -1.71331787109375, -1.6072998046875, -1.50128173828125, -1.395263671875, -1.28924560546875, -1.1832275390625, -1.07720947265625, -0.97119140625, -0.86517333984375, -0.7591552734375, -0.65313720703125, -0.547119140625, -0.44110107421875, -0.3350830078125, -0.22906494140625, -0.123046875, -0.01702880859375, 0.0889892578125, 0.19500732421875, 0.301025390625, 0.40704345703125, 0.5130615234375, 0.61907958984375, 0.72509765625, 0.83111572265625, 0.9371337890625, 1.04315185546875, 1.149169921875, 1.25518798828125, 1.3612060546875, 1.46722412109375, 1.5732421875, 1.67926025390625, 1.7852783203125, 1.89129638671875, 1.997314453125, 2.10333251953125, 2.2093505859375, 2.31536865234375, 2.42138671875, 2.52740478515625, 2.6334228515625, 2.73944091796875, 2.845458984375, 2.95147705078125, 3.0574951171875, 3.16351318359375, 3.26953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 7.0, 8.0, 12.0, 8.0, 5.0, 11.0, 25.0, 35.0, 37.0, 52.0, 90.0, 152.0, 295.0, 609.0, 1389.0, 3409.0, 8644.0, 21195.0, 52179.0, 136748.0, 326092.0, 300045.0, 118911.0, 46449.0, 18997.0, 7566.0, 3033.0, 1291.0, 569.0, 266.0, 125.0, 89.0, 63.0, 30.0, 25.0, 16.0, 10.0, 20.0, 11.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.86328125, -3.7459716796875, -3.628662109375, -3.5113525390625, -3.39404296875, -3.2767333984375, -3.159423828125, -3.0421142578125, -2.9248046875, -2.8074951171875, -2.690185546875, -2.5728759765625, -2.45556640625, -2.3382568359375, -2.220947265625, -2.1036376953125, -1.986328125, -1.8690185546875, -1.751708984375, -1.6343994140625, -1.51708984375, -1.3997802734375, -1.282470703125, -1.1651611328125, -1.0478515625, -0.9305419921875, -0.813232421875, -0.6959228515625, -0.57861328125, -0.4613037109375, -0.343994140625, -0.2266845703125, -0.109375, 0.0079345703125, 0.125244140625, 0.2425537109375, 0.35986328125, 0.4771728515625, 0.594482421875, 0.7117919921875, 0.8291015625, 0.9464111328125, 1.063720703125, 1.1810302734375, 1.29833984375, 1.4156494140625, 1.532958984375, 1.6502685546875, 1.767578125, 1.8848876953125, 2.002197265625, 2.1195068359375, 2.23681640625, 2.3541259765625, 2.471435546875, 2.5887451171875, 2.7060546875, 2.8233642578125, 2.940673828125, 3.0579833984375, 3.17529296875, 3.2926025390625, 3.409912109375, 3.5272216796875, 3.64453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 3.0, 6.0, 9.0, 8.0, 12.0, 18.0, 11.0, 21.0, 17.0, 13.0, 21.0, 22.0, 46.0, 42.0, 33.0, 59.0, 54.0, 68.0, 162.0, 1378.0, 416.0, 146.0, 80.0, 53.0, 37.0, 43.0, 36.0, 35.0, 27.0, 28.0, 20.0, 20.0, 14.0, 15.0, 12.0, 6.0, 10.0, 12.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.5078125, -11.13623046875, -10.7646484375, -10.39306640625, -10.021484375, -9.64990234375, -9.2783203125, -8.90673828125, -8.53515625, -8.16357421875, -7.7919921875, -7.42041015625, -7.048828125, -6.67724609375, -6.3056640625, -5.93408203125, -5.5625, -5.19091796875, -4.8193359375, -4.44775390625, -4.076171875, -3.70458984375, -3.3330078125, -2.96142578125, -2.58984375, -2.21826171875, -1.8466796875, -1.47509765625, -1.103515625, -0.73193359375, -0.3603515625, 0.01123046875, 0.3828125, 0.75439453125, 1.1259765625, 1.49755859375, 1.869140625, 2.24072265625, 2.6123046875, 2.98388671875, 3.35546875, 3.72705078125, 4.0986328125, 4.47021484375, 4.841796875, 5.21337890625, 5.5849609375, 5.95654296875, 6.328125, 6.69970703125, 7.0712890625, 7.44287109375, 7.814453125, 8.18603515625, 8.5576171875, 8.92919921875, 9.30078125, 9.67236328125, 10.0439453125, 10.41552734375, 10.787109375, 11.15869140625, 11.5302734375, 11.90185546875, 12.2734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 17.0, 22.0, 38.0, 31.0, 50.0, 87.0, 148.0, 267.0, 508.0, 1287.0, 31112.0, 3101959.0, 8069.0, 999.0, 467.0, 202.0, 127.0, 76.0, 57.0, 41.0, 36.0, 19.0, 16.0, 20.0, 5.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53125, -28.3681640625, -27.205078125, -26.0419921875, -24.87890625, -23.7158203125, -22.552734375, -21.3896484375, -20.2265625, -19.0634765625, -17.900390625, -16.7373046875, -15.57421875, -14.4111328125, -13.248046875, -12.0849609375, -10.921875, -9.7587890625, -8.595703125, -7.4326171875, -6.26953125, -5.1064453125, -3.943359375, -2.7802734375, -1.6171875, -0.4541015625, 0.708984375, 1.8720703125, 3.03515625, 4.1982421875, 5.361328125, 6.5244140625, 7.6875, 8.8505859375, 10.013671875, 11.1767578125, 12.33984375, 13.5029296875, 14.666015625, 15.8291015625, 16.9921875, 18.1552734375, 19.318359375, 20.4814453125, 21.64453125, 22.8076171875, 23.970703125, 25.1337890625, 26.296875, 27.4599609375, 28.623046875, 29.7861328125, 30.94921875, 32.1123046875, 33.275390625, 34.4384765625, 35.6015625, 36.7646484375, 37.927734375, 39.0908203125, 40.25390625, 41.4169921875, 42.580078125, 43.7431640625, 44.90625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 77.0, 730.0, 202.0, 6.0, 2.0, 2.0], "bins": [-184.623779296875, -181.52517700195312, -178.42657470703125, -175.32798767089844, -172.22938537597656, -169.1307830810547, -166.03219604492188, -162.93359375, -159.83499145507812, -156.73638916015625, -153.63778686523438, -150.53919982910156, -147.4405975341797, -144.3419952392578, -141.243408203125, -138.14480590820312, -135.04620361328125, -131.94760131835938, -128.8489990234375, -125.75041198730469, -122.65180969238281, -119.55320739746094, -116.4546127319336, -113.35601806640625, -110.25741577148438, -107.1588134765625, -104.06021881103516, -100.96162414550781, -97.86302185058594, -94.76441955566406, -91.66582489013672, -88.56723022460938, -85.46862030029297, -82.37002563476562, -79.27142333984375, -76.17282104492188, -73.07422637939453, -69.97563171386719, -66.87702941894531, -63.7784309387207, -60.679832458496094, -57.581233978271484, -54.482635498046875, -51.384037017822266, -48.285438537597656, -45.18684005737305, -42.08824157714844, -38.98964309692383, -35.89104461669922, -32.79244613647461, -29.69384765625, -26.59524917602539, -23.49665069580078, -20.398052215576172, -17.299453735351562, -14.200855255126953, -11.102258682250977, -8.003660202026367, -4.905061721801758, -1.8064632415771484, 1.292135238647461, 4.39073371887207, 7.48933219909668, 10.587930679321289, 13.686529159545898]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 4.0, 6.0, 12.0, 13.0, 11.0, 9.0, 18.0, 24.0, 29.0, 30.0, 24.0, 37.0, 33.0, 41.0, 44.0, 37.0, 43.0, 44.0, 39.0, 34.0, 45.0, 39.0, 42.0, 36.0, 40.0, 33.0, 32.0, 22.0, 19.0, 18.0, 25.0, 23.0, 9.0, 12.0, 13.0, 9.0, 13.0, 6.0, 5.0, 4.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.117712020874023, -28.188800811767578, -27.2598876953125, -26.330976486206055, -25.40206527709961, -24.47315216064453, -23.544240951538086, -22.61532974243164, -21.686416625976562, -20.757505416870117, -19.82859230041504, -18.899681091308594, -17.97076988220215, -17.04185676574707, -16.112945556640625, -15.184033393859863, -14.255122184753418, -13.326210021972656, -12.397298812866211, -11.46838665008545, -10.539474487304688, -9.610563278198242, -8.68165111541748, -7.752738952636719, -6.823827266693115, -5.894915580749512, -4.96600341796875, -4.0370917320251465, -3.108179807662964, -2.1792678833007812, -1.2503561973571777, -0.321444034576416, 0.6074676513671875, 1.5363795757293701, 2.4652915000915527, 3.3942031860351562, 4.323115348815918, 5.2520270347595215, 6.180938720703125, 7.109850883483887, 8.038763046264648, 8.96767520904541, 9.896586418151855, 10.825498580932617, 11.754410743713379, 12.68332290649414, 13.612234115600586, 14.541146278381348, 15.470057487487793, 16.398969650268555, 17.327880859375, 18.256793975830078, 19.185705184936523, 20.11461639404297, 21.043529510498047, 21.972440719604492, 22.901351928710938, 23.830263137817383, 24.75917625427246, 25.688087463378906, 26.61699867248535, 27.54591178894043, 28.474822998046875, 29.403736114501953, 30.3326473236084]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 4.0, 8.0, 12.0, 13.0, 16.0, 10.0, 29.0, 17.0, 15.0, 25.0, 25.0, 31.0, 26.0, 36.0, 37.0, 27.0, 59.0, 40.0, 49.0, 40.0, 34.0, 34.0, 38.0, 36.0, 31.0, 37.0, 37.0, 36.0, 21.0, 30.0, 22.0, 21.0, 9.0, 14.0, 19.0, 12.0, 6.0, 6.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.990234375, -3.873260498046875, -3.75628662109375, -3.639312744140625, -3.5223388671875, -3.405364990234375, -3.28839111328125, -3.171417236328125, -3.054443359375, -2.937469482421875, -2.82049560546875, -2.703521728515625, -2.5865478515625, -2.469573974609375, -2.35260009765625, -2.235626220703125, -2.11865234375, -2.001678466796875, -1.88470458984375, -1.767730712890625, -1.6507568359375, -1.533782958984375, -1.41680908203125, -1.299835205078125, -1.182861328125, -1.065887451171875, -0.94891357421875, -0.831939697265625, -0.7149658203125, -0.597991943359375, -0.48101806640625, -0.364044189453125, -0.2470703125, -0.130096435546875, -0.01312255859375, 0.103851318359375, 0.2208251953125, 0.337799072265625, 0.45477294921875, 0.571746826171875, 0.688720703125, 0.805694580078125, 0.92266845703125, 1.039642333984375, 1.1566162109375, 1.273590087890625, 1.39056396484375, 1.507537841796875, 1.62451171875, 1.741485595703125, 1.85845947265625, 1.975433349609375, 2.0924072265625, 2.209381103515625, 2.32635498046875, 2.443328857421875, 2.560302734375, 2.677276611328125, 2.79425048828125, 2.911224365234375, 3.0281982421875, 3.145172119140625, 3.26214599609375, 3.379119873046875, 3.49609375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 9.0, 10.0, 9.0, 6.0, 11.0, 15.0, 21.0, 18.0, 17.0, 28.0, 34.0, 56.0, 64.0, 72.0, 107.0, 167.0, 343.0, 1573.0, 69515.0, 2964696.0, 1143881.0, 12046.0, 764.0, 224.0, 151.0, 83.0, 69.0, 68.0, 40.0, 31.0, 23.0, 24.0, 18.0, 17.0, 13.0, 15.0, 8.0, 12.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9375, -12.53076171875, -12.1240234375, -11.71728515625, -11.310546875, -10.90380859375, -10.4970703125, -10.09033203125, -9.68359375, -9.27685546875, -8.8701171875, -8.46337890625, -8.056640625, -7.64990234375, -7.2431640625, -6.83642578125, -6.4296875, -6.02294921875, -5.6162109375, -5.20947265625, -4.802734375, -4.39599609375, -3.9892578125, -3.58251953125, -3.17578125, -2.76904296875, -2.3623046875, -1.95556640625, -1.548828125, -1.14208984375, -0.7353515625, -0.32861328125, 0.078125, 0.48486328125, 0.8916015625, 1.29833984375, 1.705078125, 2.11181640625, 2.5185546875, 2.92529296875, 3.33203125, 3.73876953125, 4.1455078125, 4.55224609375, 4.958984375, 5.36572265625, 5.7724609375, 6.17919921875, 6.5859375, 6.99267578125, 7.3994140625, 7.80615234375, 8.212890625, 8.61962890625, 9.0263671875, 9.43310546875, 9.83984375, 10.24658203125, 10.6533203125, 11.06005859375, 11.466796875, 11.87353515625, 12.2802734375, 12.68701171875, 13.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 27.0, 19.0, 43.0, 71.0, 73.0, 103.0, 210.0, 302.0, 411.0, 574.0, 620.0, 530.0, 374.0, 267.0, 165.0, 100.0, 63.0, 43.0, 24.0, 4.0, 11.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.03125, -11.765625, -11.5, -11.234375, -10.96875, -10.703125, -10.4375, -10.171875, -9.90625, -9.640625, -9.375, -9.109375, -8.84375, -8.578125, -8.3125, -8.046875, -7.78125, -7.515625, -7.25, -6.984375, -6.71875, -6.453125, -6.1875, -5.921875, -5.65625, -5.390625, -5.125, -4.859375, -4.59375, -4.328125, -4.0625, -3.796875, -3.53125, -3.265625, -3.0, -2.734375, -2.46875, -2.203125, -1.9375, -1.671875, -1.40625, -1.140625, -0.875, -0.609375, -0.34375, -0.078125, 0.1875, 0.453125, 0.71875, 0.984375, 1.25, 1.515625, 1.78125, 2.046875, 2.3125, 2.578125, 2.84375, 3.109375, 3.375, 3.640625, 3.90625, 4.171875, 4.4375, 4.703125, 4.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 5.0, 14.0, 8.0, 17.0, 24.0, 46.0, 50.0, 84.0, 139.0, 195.0, 313.0, 500.0, 1223.0, 16487.0, 3858583.0, 312329.0, 2390.0, 707.0, 380.0, 241.0, 160.0, 130.0, 92.0, 55.0, 36.0, 26.0, 18.0, 9.0, 14.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.205078125, -14.34765625, -13.490234375, -12.6328125, -11.775390625, -10.91796875, -10.060546875, -9.203125, -8.345703125, -7.48828125, -6.630859375, -5.7734375, -4.916015625, -4.05859375, -3.201171875, -2.34375, -1.486328125, -0.62890625, 0.228515625, 1.0859375, 1.943359375, 2.80078125, 3.658203125, 4.515625, 5.373046875, 6.23046875, 7.087890625, 7.9453125, 8.802734375, 9.66015625, 10.517578125, 11.375, 12.232421875, 13.08984375, 13.947265625, 14.8046875, 15.662109375, 16.51953125, 17.376953125, 18.234375, 19.091796875, 19.94921875, 20.806640625, 21.6640625, 22.521484375, 23.37890625, 24.236328125, 25.09375, 25.951171875, 26.80859375, 27.666015625, 28.5234375, 29.380859375, 30.23828125, 31.095703125, 31.953125, 32.810546875, 33.66796875, 34.525390625, 35.3828125, 36.240234375, 37.09765625, 37.955078125, 38.8125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 52.0, 519.0, 401.0, 41.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.8626251220703, -188.92396545410156, -184.98529052734375, -181.046630859375, -177.10797119140625, -173.16929626464844, -169.2306365966797, -165.29196166992188, -161.35330200195312, -157.41464233398438, -153.47596740722656, -149.5373077392578, -145.5986328125, -141.65997314453125, -137.7213134765625, -133.7826385498047, -129.84397888183594, -125.90531158447266, -121.96664428710938, -118.02798461914062, -114.08931732177734, -110.15065002441406, -106.21199035644531, -102.27332305908203, -98.33465576171875, -94.39598846435547, -90.45732116699219, -86.51866149902344, -82.57999420166016, -78.64132690429688, -74.70266723632812, -70.76399993896484, -66.8253402709961, -62.88667297363281, -58.9480094909668, -55.00934600830078, -51.0706787109375, -47.13201141357422, -43.1933479309082, -39.25468444824219, -35.316017150878906, -31.377351760864258, -27.43868637084961, -23.50002098083496, -19.561355590820312, -15.622690200805664, -11.684024810791016, -7.745359420776367, -3.8066940307617188, 0.1319713592529297, 4.070636749267578, 8.009302139282227, 11.947967529296875, 15.886632919311523, 19.825298309326172, 23.76396369934082, 27.70262908935547, 31.641294479370117, 35.579959869384766, 39.51862335205078, 43.45729064941406, 47.395957946777344, 51.33462142944336, 55.273284912109375, 59.211952209472656]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 1.0, 7.0, 4.0, 9.0, 11.0, 12.0, 12.0, 12.0, 19.0, 33.0, 35.0, 36.0, 20.0, 42.0, 39.0, 37.0, 41.0, 47.0, 48.0, 34.0, 50.0, 53.0, 39.0, 43.0, 52.0, 29.0, 31.0, 33.0, 18.0, 31.0, 25.0, 15.0, 12.0, 14.0, 9.0, 10.0, 7.0, 9.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-25.860363006591797, -25.138200759887695, -24.416038513183594, -23.693878173828125, -22.971715927124023, -22.249553680419922, -21.52739143371582, -20.80522918701172, -20.08306884765625, -19.36090660095215, -18.638744354248047, -17.916584014892578, -17.194421768188477, -16.472259521484375, -15.750097274780273, -15.027935981750488, -14.305773735046387, -13.583611488342285, -12.8614501953125, -12.139287948608398, -11.417126655578613, -10.694964408874512, -9.972803115844727, -9.250640869140625, -8.528478622436523, -7.80631685256958, -7.084155082702637, -6.361992835998535, -5.63983154296875, -4.917669296264648, -4.195507526397705, -3.4733457565307617, -2.7511844635009766, -2.029022693634033, -1.3068608045578003, -0.5846989154815674, 0.13746285438537598, 0.8596246242523193, 1.5817866325378418, 2.303948402404785, 3.0261101722717285, 3.748271942138672, 4.470433712005615, 5.192595481872559, 5.91475772857666, 6.636919021606445, 7.359081268310547, 8.081243515014648, 8.803404808044434, 9.525567054748535, 10.24772834777832, 10.969890594482422, 11.692051887512207, 12.414214134216309, 13.136375427246094, 13.858537673950195, 14.580699920654297, 15.302862167358398, 16.0250244140625, 16.74718475341797, 17.46934700012207, 18.191509246826172, 18.913671493530273, 19.635833740234375, 20.357994079589844]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 6.0, 13.0, 15.0, 13.0, 17.0, 17.0, 23.0, 38.0, 36.0, 48.0, 49.0, 38.0, 35.0, 53.0, 48.0, 45.0, 37.0, 31.0, 34.0, 35.0, 29.0, 33.0, 41.0, 44.0, 24.0, 30.0, 26.0, 19.0, 19.0, 23.0, 13.0, 8.0, 10.0, 3.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.51171875, -4.388824462890625, -4.26593017578125, -4.143035888671875, -4.0201416015625, -3.897247314453125, -3.77435302734375, -3.651458740234375, -3.528564453125, -3.405670166015625, -3.28277587890625, -3.159881591796875, -3.0369873046875, -2.914093017578125, -2.79119873046875, -2.668304443359375, -2.54541015625, -2.422515869140625, -2.29962158203125, -2.176727294921875, -2.0538330078125, -1.930938720703125, -1.80804443359375, -1.685150146484375, -1.562255859375, -1.439361572265625, -1.31646728515625, -1.193572998046875, -1.0706787109375, -0.947784423828125, -0.82489013671875, -0.701995849609375, -0.5791015625, -0.456207275390625, -0.33331298828125, -0.210418701171875, -0.0875244140625, 0.035369873046875, 0.15826416015625, 0.281158447265625, 0.404052734375, 0.526947021484375, 0.64984130859375, 0.772735595703125, 0.8956298828125, 1.018524169921875, 1.14141845703125, 1.264312744140625, 1.38720703125, 1.510101318359375, 1.63299560546875, 1.755889892578125, 1.8787841796875, 2.001678466796875, 2.12457275390625, 2.247467041015625, 2.370361328125, 2.493255615234375, 2.61614990234375, 2.739044189453125, 2.8619384765625, 2.984832763671875, 3.10772705078125, 3.230621337890625, 3.353515625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 11.0, 16.0, 20.0, 18.0, 31.0, 68.0, 94.0, 124.0, 223.0, 308.0, 491.0, 591.0, 1013.0, 1415.0, 2239.0, 3340.0, 5172.0, 8046.0, 12707.0, 20244.0, 34400.0, 60229.0, 108519.0, 227893.0, 269785.0, 125269.0, 66140.0, 38119.0, 22790.0, 13873.0, 8703.0, 5658.0, 3721.0, 2397.0, 1582.0, 1091.0, 746.0, 491.0, 327.0, 233.0, 118.0, 112.0, 50.0, 55.0, 28.0, 22.0, 22.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7119140625, -0.6904067993164062, -0.6688995361328125, -0.6473922729492188, -0.625885009765625, -0.6043777465820312, -0.5828704833984375, -0.5613632202148438, -0.53985595703125, -0.5183486938476562, -0.4968414306640625, -0.47533416748046875, -0.453826904296875, -0.43231964111328125, -0.4108123779296875, -0.38930511474609375, -0.3677978515625, -0.34629058837890625, -0.3247833251953125, -0.30327606201171875, -0.281768798828125, -0.26026153564453125, -0.2387542724609375, -0.21724700927734375, -0.19573974609375, -0.17423248291015625, -0.1527252197265625, -0.13121795654296875, -0.109710693359375, -0.08820343017578125, -0.0666961669921875, -0.04518890380859375, -0.023681640625, -0.00217437744140625, 0.0193328857421875, 0.04084014892578125, 0.062347412109375, 0.08385467529296875, 0.1053619384765625, 0.12686920166015625, 0.14837646484375, 0.16988372802734375, 0.1913909912109375, 0.21289825439453125, 0.234405517578125, 0.25591278076171875, 0.2774200439453125, 0.29892730712890625, 0.3204345703125, 0.34194183349609375, 0.3634490966796875, 0.38495635986328125, 0.406463623046875, 0.42797088623046875, 0.4494781494140625, 0.47098541259765625, 0.49249267578125, 0.5139999389648438, 0.5355072021484375, 0.5570144653320312, 0.578521728515625, 0.6000289916992188, 0.6215362548828125, 0.6430435180664062, 0.66455078125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 9.0, 6.0, 5.0, 8.0, 10.0, 9.0, 16.0, 12.0, 15.0, 16.0, 32.0, 18.0, 22.0, 27.0, 35.0, 32.0, 36.0, 34.0, 44.0, 37.0, 30.0, 1072.0, 35.0, 37.0, 39.0, 28.0, 38.0, 29.0, 29.0, 32.0, 27.0, 22.0, 20.0, 20.0, 23.0, 18.0, 12.0, 15.0, 18.0, 8.0, 8.0, 10.0, 5.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-2.1328125, -2.067962646484375, -2.00311279296875, -1.938262939453125, -1.8734130859375, -1.808563232421875, -1.74371337890625, -1.678863525390625, -1.614013671875, -1.549163818359375, -1.48431396484375, -1.419464111328125, -1.3546142578125, -1.289764404296875, -1.22491455078125, -1.160064697265625, -1.09521484375, -1.030364990234375, -0.96551513671875, -0.900665283203125, -0.8358154296875, -0.770965576171875, -0.70611572265625, -0.641265869140625, -0.576416015625, -0.511566162109375, -0.44671630859375, -0.381866455078125, -0.3170166015625, -0.252166748046875, -0.18731689453125, -0.122467041015625, -0.0576171875, 0.007232666015625, 0.07208251953125, 0.136932373046875, 0.2017822265625, 0.266632080078125, 0.33148193359375, 0.396331787109375, 0.461181640625, 0.526031494140625, 0.59088134765625, 0.655731201171875, 0.7205810546875, 0.785430908203125, 0.85028076171875, 0.915130615234375, 0.97998046875, 1.044830322265625, 1.10968017578125, 1.174530029296875, 1.2393798828125, 1.304229736328125, 1.36907958984375, 1.433929443359375, 1.498779296875, 1.563629150390625, 1.62847900390625, 1.693328857421875, 1.7581787109375, 1.823028564453125, 1.88787841796875, 1.952728271484375, 2.017578125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 10.0, 29.0, 48.0, 67.0, 69.0, 101.0, 193.0, 261.0, 374.0, 521.0, 735.0, 1092.0, 1587.0, 2173.0, 3001.0, 4478.0, 6365.0, 9204.0, 14080.0, 20772.0, 32225.0, 52201.0, 87497.0, 170813.0, 1333718.0, 143218.0, 77321.0, 46323.0, 29155.0, 18954.0, 12593.0, 8440.0, 5884.0, 4102.0, 2749.0, 2101.0, 1400.0, 980.0, 687.0, 475.0, 373.0, 256.0, 157.0, 102.0, 72.0, 62.0, 34.0, 25.0, 16.0, 7.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.57421875, -0.556488037109375, -0.53875732421875, -0.521026611328125, -0.5032958984375, -0.485565185546875, -0.46783447265625, -0.450103759765625, -0.432373046875, -0.414642333984375, -0.39691162109375, -0.379180908203125, -0.3614501953125, -0.343719482421875, -0.32598876953125, -0.308258056640625, -0.29052734375, -0.272796630859375, -0.25506591796875, -0.237335205078125, -0.2196044921875, -0.201873779296875, -0.18414306640625, -0.166412353515625, -0.148681640625, -0.130950927734375, -0.11322021484375, -0.095489501953125, -0.0777587890625, -0.060028076171875, -0.04229736328125, -0.024566650390625, -0.0068359375, 0.010894775390625, 0.02862548828125, 0.046356201171875, 0.0640869140625, 0.081817626953125, 0.09954833984375, 0.117279052734375, 0.135009765625, 0.152740478515625, 0.17047119140625, 0.188201904296875, 0.2059326171875, 0.223663330078125, 0.24139404296875, 0.259124755859375, 0.27685546875, 0.294586181640625, 0.31231689453125, 0.330047607421875, 0.3477783203125, 0.365509033203125, 0.38323974609375, 0.400970458984375, 0.418701171875, 0.436431884765625, 0.45416259765625, 0.471893310546875, 0.4896240234375, 0.507354736328125, 0.52508544921875, 0.542816162109375, 0.560546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 1.0, 2.0, 5.0, 10.0, 15.0, 18.0, 14.0, 19.0, 13.0, 26.0, 28.0, 33.0, 40.0, 43.0, 50.0, 43.0, 70.0, 66.0, 67.0, 50.0, 41.0, 59.0, 45.0, 57.0, 34.0, 32.0, 17.0, 22.0, 12.0, 10.0, 10.0, 5.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004227161407470703, -0.0004104338586330414, -0.00039815157651901245, -0.0003858692944049835, -0.0003735870122909546, -0.00036130473017692566, -0.00034902244806289673, -0.0003367401659488678, -0.00032445788383483887, -0.00031217560172080994, -0.000299893319606781, -0.0002876110374927521, -0.00027532875537872314, -0.0002630464732646942, -0.0002507641911506653, -0.00023848190903663635, -0.00022619962692260742, -0.0002139173448085785, -0.00020163506269454956, -0.00018935278058052063, -0.0001770704984664917, -0.00016478821635246277, -0.00015250593423843384, -0.0001402236521244049, -0.00012794137001037598, -0.00011565908789634705, -0.00010337680578231812, -9.109452366828918e-05, -7.881224155426025e-05, -6.652995944023132e-05, -5.424767732620239e-05, -4.196539521217346e-05, -2.968311309814453e-05, -1.74008309841156e-05, -5.11854887008667e-06, 7.163733243942261e-06, 1.944601535797119e-05, 3.172829747200012e-05, 4.401057958602905e-05, 5.6292861700057983e-05, 6.857514381408691e-05, 8.085742592811584e-05, 9.313970804214478e-05, 0.0001054219901561737, 0.00011770427227020264, 0.00012998655438423157, 0.0001422688364982605, 0.00015455111861228943, 0.00016683340072631836, 0.0001791156828403473, 0.00019139796495437622, 0.00020368024706840515, 0.00021596252918243408, 0.000228244811296463, 0.00024052709341049194, 0.0002528093755245209, 0.0002650916576385498, 0.00027737393975257874, 0.00028965622186660767, 0.0003019385039806366, 0.00031422078609466553, 0.00032650306820869446, 0.0003387853503227234, 0.0003510676324367523, 0.00036334991455078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 8.0, 8.0, 10.0, 13.0, 12.0, 18.0, 18.0, 22.0, 30.0, 39.0, 63.0, 74.0, 114.0, 179.0, 312.0, 554.0, 2123.0, 1018539.0, 24327.0, 921.0, 378.0, 210.0, 148.0, 88.0, 79.0, 57.0, 36.0, 30.0, 27.0, 28.0, 15.0, 21.0, 13.0, 10.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00717926025390625, -0.0069200992584228516, -0.006660938262939453, -0.006401777267456055, -0.006142616271972656, -0.005883455276489258, -0.005624294281005859, -0.005365133285522461, -0.0051059722900390625, -0.004846811294555664, -0.004587650299072266, -0.004328489303588867, -0.004069328308105469, -0.0038101673126220703, -0.003551006317138672, -0.0032918453216552734, -0.003032684326171875, -0.0027735233306884766, -0.002514362335205078, -0.0022552013397216797, -0.0019960403442382812, -0.0017368793487548828, -0.0014777183532714844, -0.001218557357788086, -0.0009593963623046875, -0.0007002353668212891, -0.0004410743713378906, -0.0001819133758544922, 7.724761962890625e-05, 0.0003364086151123047, 0.0005955696105957031, 0.0008547306060791016, 0.0011138916015625, 0.0013730525970458984, 0.0016322135925292969, 0.0018913745880126953, 0.0021505355834960938, 0.002409696578979492, 0.0026688575744628906, 0.002928018569946289, 0.0031871795654296875, 0.003446340560913086, 0.0037055015563964844, 0.003964662551879883, 0.004223823547363281, 0.00448298454284668, 0.004742145538330078, 0.0050013065338134766, 0.005260467529296875, 0.0055196285247802734, 0.005778789520263672, 0.00603795051574707, 0.006297111511230469, 0.006556272506713867, 0.006815433502197266, 0.007074594497680664, 0.0073337554931640625, 0.007592916488647461, 0.00785207748413086, 0.008111238479614258, 0.008370399475097656, 0.008629560470581055, 0.008888721466064453, 0.009147882461547852, 0.00940704345703125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 51.0, 151.0, 318.0, 270.0, 146.0, 55.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005862560938112438, -0.0005699560279026628, -0.0005536559037864208, -0.0005373557796701789, -0.0005210557137615979, -0.0005047556478530169, -0.0004884555237367749, -0.00047215542872436345, -0.00045585533371195197, -0.0004395552386995405, -0.000423255143687129, -0.00040695504867471755, -0.00039065495366230607, -0.0003743548586498946, -0.0003580547636374831, -0.00034175466862507164, -0.00032545457361266017, -0.0003091544786002487, -0.0002928543835878372, -0.00027655428857542574, -0.00026025419356301427, -0.0002439540985506028, -0.00022765400353819132, -0.00021135390852577984, -0.00019505381351336837, -0.0001787537185009569, -0.00016245362348854542, -0.00014615352847613394, -0.00012985343346372247, -0.00011355333845131099, -9.725324343889952e-05, -8.095314842648804e-05, -6.465302431024611e-05, -4.8352929297834635e-05, -3.205283428542316e-05, -1.5752739273011684e-05, 5.473557393997908e-07, 1.6847450751811266e-05, 3.314754576422274e-05, 4.9447640776634216e-05, 6.574773578904569e-05, 8.204783080145717e-05, 9.834792581386864e-05, 0.00011464802082628012, 0.0001309481158386916, 0.00014724821085110307, 0.00016354830586351454, 0.00017984840087592602, 0.0001961484958883375, 0.00021244859090074897, 0.00022874868591316044, 0.0002450487809255719, 0.0002613488759379834, 0.00027764897095039487, 0.00029394906596280634, 0.0003102491609752178, 0.0003265492559876293, 0.00034284935100004077, 0.00035914944601245224, 0.0003754495410248637, 0.0003917496360372752, 0.00040804973104968667, 0.00042434982606209815, 0.0004406499210745096, 0.0004569500160869211]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 11.0, 11.0, 21.0, 28.0, 19.0, 31.0, 34.0, 44.0, 37.0, 48.0, 45.0, 41.0, 38.0, 50.0, 36.0, 49.0, 51.0, 42.0, 42.0, 54.0, 44.0, 18.0, 21.0, 30.0, 22.0, 23.0, 17.0, 17.0, 12.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025659799575805664, -0.0002493634819984436, -0.00024212896823883057, -0.00023489445447921753, -0.0002276599407196045, -0.00022042542695999146, -0.00021319091320037842, -0.00020595639944076538, -0.00019872188568115234, -0.0001914873719215393, -0.00018425285816192627, -0.00017701834440231323, -0.0001697838306427002, -0.00016254931688308716, -0.00015531480312347412, -0.00014808028936386108, -0.00014084577560424805, -0.000133611261844635, -0.00012637674808502197, -0.00011914223432540894, -0.0001119077205657959, -0.00010467320680618286, -9.743869304656982e-05, -9.020417928695679e-05, -8.296966552734375e-05, -7.573515176773071e-05, -6.850063800811768e-05, -6.126612424850464e-05, -5.40316104888916e-05, -4.6797096729278564e-05, -3.956258296966553e-05, -3.232806921005249e-05, -2.5093555450439453e-05, -1.7859041690826416e-05, -1.0624527931213379e-05, -3.390014171600342e-06, 3.844499588012695e-06, 1.1079013347625732e-05, 1.831352710723877e-05, 2.5548040866851807e-05, 3.2782554626464844e-05, 4.001706838607788e-05, 4.725158214569092e-05, 5.4486095905303955e-05, 6.172060966491699e-05, 6.895512342453003e-05, 7.618963718414307e-05, 8.34241509437561e-05, 9.065866470336914e-05, 9.789317846298218e-05, 0.00010512769222259521, 0.00011236220598220825, 0.00011959671974182129, 0.00012683123350143433, 0.00013406574726104736, 0.0001413002610206604, 0.00014853477478027344, 0.00015576928853988647, 0.0001630038022994995, 0.00017023831605911255, 0.00017747282981872559, 0.00018470734357833862, 0.00019194185733795166, 0.0001991763710975647, 0.00020641088485717773]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 6.0, 13.0, 15.0, 13.0, 17.0, 17.0, 23.0, 38.0, 36.0, 48.0, 49.0, 38.0, 35.0, 53.0, 48.0, 45.0, 37.0, 31.0, 34.0, 35.0, 29.0, 33.0, 41.0, 44.0, 25.0, 29.0, 26.0, 19.0, 19.0, 23.0, 13.0, 8.0, 10.0, 3.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.51171875, -4.388824462890625, -4.26593017578125, -4.143035888671875, -4.0201416015625, -3.897247314453125, -3.77435302734375, -3.651458740234375, -3.528564453125, -3.405670166015625, -3.28277587890625, -3.159881591796875, -3.0369873046875, -2.914093017578125, -2.79119873046875, -2.668304443359375, -2.54541015625, -2.422515869140625, -2.29962158203125, -2.176727294921875, -2.0538330078125, -1.930938720703125, -1.80804443359375, -1.685150146484375, -1.562255859375, -1.439361572265625, -1.31646728515625, -1.193572998046875, -1.0706787109375, -0.947784423828125, -0.82489013671875, -0.701995849609375, -0.5791015625, -0.456207275390625, -0.33331298828125, -0.210418701171875, -0.0875244140625, 0.035369873046875, 0.15826416015625, 0.281158447265625, 0.404052734375, 0.526947021484375, 0.64984130859375, 0.772735595703125, 0.8956298828125, 1.018524169921875, 1.14141845703125, 1.264312744140625, 1.38720703125, 1.510101318359375, 1.63299560546875, 1.755889892578125, 1.8787841796875, 2.001678466796875, 2.12457275390625, 2.247467041015625, 2.370361328125, 2.493255615234375, 2.61614990234375, 2.739044189453125, 2.8619384765625, 2.984832763671875, 3.10772705078125, 3.230621337890625, 3.353515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 8.0, 5.0, 14.0, 13.0, 16.0, 18.0, 22.0, 36.0, 56.0, 60.0, 102.0, 112.0, 166.0, 246.0, 334.0, 644.0, 2070.0, 9036.0, 46324.0, 310888.0, 558504.0, 96448.0, 17400.0, 3628.0, 942.0, 450.0, 278.0, 188.0, 134.0, 94.0, 80.0, 64.0, 34.0, 36.0, 20.0, 21.0, 19.0, 12.0, 12.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-7.9609375, -7.7469482421875, -7.532958984375, -7.3189697265625, -7.10498046875, -6.8909912109375, -6.677001953125, -6.4630126953125, -6.2490234375, -6.0350341796875, -5.821044921875, -5.6070556640625, -5.39306640625, -5.1790771484375, -4.965087890625, -4.7510986328125, -4.537109375, -4.3231201171875, -4.109130859375, -3.8951416015625, -3.68115234375, -3.4671630859375, -3.253173828125, -3.0391845703125, -2.8251953125, -2.6112060546875, -2.397216796875, -2.1832275390625, -1.96923828125, -1.7552490234375, -1.541259765625, -1.3272705078125, -1.11328125, -0.8992919921875, -0.685302734375, -0.4713134765625, -0.25732421875, -0.0433349609375, 0.170654296875, 0.3846435546875, 0.5986328125, 0.8126220703125, 1.026611328125, 1.2406005859375, 1.45458984375, 1.6685791015625, 1.882568359375, 2.0965576171875, 2.310546875, 2.5245361328125, 2.738525390625, 2.9525146484375, 3.16650390625, 3.3804931640625, 3.594482421875, 3.8084716796875, 4.0224609375, 4.2364501953125, 4.450439453125, 4.6644287109375, 4.87841796875, 5.0924072265625, 5.306396484375, 5.5203857421875, 5.734375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 1.0, 12.0, 8.0, 9.0, 16.0, 15.0, 15.0, 13.0, 13.0, 17.0, 21.0, 29.0, 24.0, 34.0, 34.0, 43.0, 47.0, 58.0, 77.0, 211.0, 1548.0, 288.0, 97.0, 75.0, 39.0, 47.0, 28.0, 28.0, 31.0, 30.0, 22.0, 17.0, 14.0, 19.0, 15.0, 12.0, 11.0, 9.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.108154296875, -13.70068359375, -13.293212890625, -12.8857421875, -12.478271484375, -12.07080078125, -11.663330078125, -11.255859375, -10.848388671875, -10.44091796875, -10.033447265625, -9.6259765625, -9.218505859375, -8.81103515625, -8.403564453125, -7.99609375, -7.588623046875, -7.18115234375, -6.773681640625, -6.3662109375, -5.958740234375, -5.55126953125, -5.143798828125, -4.736328125, -4.328857421875, -3.92138671875, -3.513916015625, -3.1064453125, -2.698974609375, -2.29150390625, -1.884033203125, -1.4765625, -1.069091796875, -0.66162109375, -0.254150390625, 0.1533203125, 0.560791015625, 0.96826171875, 1.375732421875, 1.783203125, 2.190673828125, 2.59814453125, 3.005615234375, 3.4130859375, 3.820556640625, 4.22802734375, 4.635498046875, 5.04296875, 5.450439453125, 5.85791015625, 6.265380859375, 6.6728515625, 7.080322265625, 7.48779296875, 7.895263671875, 8.302734375, 8.710205078125, 9.11767578125, 9.525146484375, 9.9326171875, 10.340087890625, 10.74755859375, 11.155029296875, 11.5625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 9.0, 9.0, 12.0, 12.0, 18.0, 22.0, 26.0, 35.0, 48.0, 40.0, 67.0, 90.0, 113.0, 193.0, 319.0, 765.0, 2632.0, 212936.0, 2919316.0, 6657.0, 1047.0, 419.0, 276.0, 161.0, 125.0, 52.0, 56.0, 42.0, 33.0, 28.0, 25.0, 17.0, 23.0, 21.0, 10.0, 6.0, 12.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.3125, -28.37255859375, -27.4326171875, -26.49267578125, -25.552734375, -24.61279296875, -23.6728515625, -22.73291015625, -21.79296875, -20.85302734375, -19.9130859375, -18.97314453125, -18.033203125, -17.09326171875, -16.1533203125, -15.21337890625, -14.2734375, -13.33349609375, -12.3935546875, -11.45361328125, -10.513671875, -9.57373046875, -8.6337890625, -7.69384765625, -6.75390625, -5.81396484375, -4.8740234375, -3.93408203125, -2.994140625, -2.05419921875, -1.1142578125, -0.17431640625, 0.765625, 1.70556640625, 2.6455078125, 3.58544921875, 4.525390625, 5.46533203125, 6.4052734375, 7.34521484375, 8.28515625, 9.22509765625, 10.1650390625, 11.10498046875, 12.044921875, 12.98486328125, 13.9248046875, 14.86474609375, 15.8046875, 16.74462890625, 17.6845703125, 18.62451171875, 19.564453125, 20.50439453125, 21.4443359375, 22.38427734375, 23.32421875, 24.26416015625, 25.2041015625, 26.14404296875, 27.083984375, 28.02392578125, 28.9638671875, 29.90380859375, 30.84375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 39.0, 301.0, 507.0, 144.0, 21.0, 2.0], "bins": [-116.11796569824219, -114.19007873535156, -112.26219177246094, -110.33430480957031, -108.40641784667969, -106.47853088378906, -104.55064392089844, -102.62275695800781, -100.69486999511719, -98.76698303222656, -96.83909606933594, -94.91120910644531, -92.98332214355469, -91.05543518066406, -89.12754821777344, -87.19966125488281, -85.27177429199219, -83.34388732910156, -81.41600036621094, -79.48811340332031, -77.56022644042969, -75.63233947753906, -73.70445251464844, -71.77656555175781, -69.84867858886719, -67.92079162597656, -65.99290466308594, -64.06501770019531, -62.13713073730469, -60.20924377441406, -58.28135681152344, -56.35346984863281, -54.42558288574219, -52.49769592285156, -50.56980895996094, -48.64192199707031, -46.71403503417969, -44.78614807128906, -42.85826110839844, -40.93037414550781, -39.00248718261719, -37.07460021972656, -35.14671325683594, -33.21882629394531, -31.290939331054688, -29.363052368164062, -27.435165405273438, -25.507278442382812, -23.579391479492188, -21.651504516601562, -19.723617553710938, -17.795730590820312, -15.867843627929688, -13.939956665039062, -12.012069702148438, -10.084182739257812, -8.156296730041504, -6.228409767150879, -4.300522804260254, -2.372635841369629, -0.4447488784790039, 1.483138084411621, 3.411025047302246, 5.338912010192871, 7.266798973083496]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 7.0, 6.0, 5.0, 8.0, 8.0, 2.0, 10.0, 6.0, 17.0, 9.0, 18.0, 19.0, 17.0, 22.0, 35.0, 36.0, 26.0, 36.0, 34.0, 19.0, 36.0, 44.0, 48.0, 37.0, 42.0, 37.0, 33.0, 41.0, 32.0, 37.0, 22.0, 30.0, 26.0, 27.0, 13.0, 21.0, 19.0, 17.0, 15.0, 18.0, 11.0, 6.0, 8.0, 11.0, 8.0, 8.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.790145874023438, -24.929243087768555, -24.068342208862305, -23.207439422607422, -22.346538543701172, -21.48563575744629, -20.624732971191406, -19.763832092285156, -18.902929306030273, -18.04202651977539, -17.18112564086914, -16.320222854614258, -15.459321022033691, -14.598419189453125, -13.737516403198242, -12.876614570617676, -12.01571273803711, -11.154810905456543, -10.293909072875977, -9.433006286621094, -8.572104454040527, -7.711202621459961, -6.850300312042236, -5.989398002624512, -5.128496170043945, -4.267594337463379, -3.4066920280456543, -2.545789957046509, -1.6848878860473633, -0.8239860534667969, 0.036916255950927734, 0.8978185653686523, 1.7587223052978516, 2.619624376296997, 3.4805264472961426, 4.341428756713867, 5.202330589294434, 6.063232421875, 6.924134731292725, 7.785037040710449, 8.645938873291016, 9.506840705871582, 10.367742538452148, 11.228645324707031, 12.089547157287598, 12.950448989868164, 13.811351776123047, 14.672253608703613, 15.53315544128418, 16.394058227539062, 17.254959106445312, 18.115861892700195, 18.976764678955078, 19.837665557861328, 20.69856834411621, 21.559471130371094, 22.420372009277344, 23.281274795532227, 24.142175674438477, 25.00307846069336, 25.86397933959961, 26.724882125854492, 27.585784912109375, 28.446685791015625, 29.307588577270508]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 2.0, 10.0, 12.0, 9.0, 13.0, 13.0, 17.0, 21.0, 25.0, 34.0, 46.0, 40.0, 42.0, 43.0, 50.0, 40.0, 41.0, 47.0, 33.0, 44.0, 42.0, 40.0, 28.0, 34.0, 36.0, 33.0, 33.0, 26.0, 37.0, 20.0, 19.0, 8.0, 11.0, 16.0, 4.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.9453125, -4.806671142578125, -4.66802978515625, -4.529388427734375, -4.3907470703125, -4.252105712890625, -4.11346435546875, -3.974822998046875, -3.836181640625, -3.697540283203125, -3.55889892578125, -3.420257568359375, -3.2816162109375, -3.142974853515625, -3.00433349609375, -2.865692138671875, -2.72705078125, -2.588409423828125, -2.44976806640625, -2.311126708984375, -2.1724853515625, -2.033843994140625, -1.89520263671875, -1.756561279296875, -1.617919921875, -1.479278564453125, -1.34063720703125, -1.201995849609375, -1.0633544921875, -0.924713134765625, -0.78607177734375, -0.647430419921875, -0.5087890625, -0.370147705078125, -0.23150634765625, -0.092864990234375, 0.0457763671875, 0.184417724609375, 0.32305908203125, 0.461700439453125, 0.600341796875, 0.738983154296875, 0.87762451171875, 1.016265869140625, 1.1549072265625, 1.293548583984375, 1.43218994140625, 1.570831298828125, 1.70947265625, 1.848114013671875, 1.98675537109375, 2.125396728515625, 2.2640380859375, 2.402679443359375, 2.54132080078125, 2.679962158203125, 2.818603515625, 2.957244873046875, 3.09588623046875, 3.234527587890625, 3.3731689453125, 3.511810302734375, 3.65045166015625, 3.789093017578125, 3.927734375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 6.0, 6.0, 7.0, 9.0, 10.0, 19.0, 13.0, 19.0, 29.0, 27.0, 41.0, 57.0, 82.0, 104.0, 168.0, 432.0, 1369.0, 22604.0, 1271267.0, 2771432.0, 122150.0, 3113.0, 607.0, 236.0, 123.0, 74.0, 52.0, 41.0, 43.0, 29.0, 28.0, 19.0, 21.0, 12.0, 10.0, 9.0, 8.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.490966796875, -11.12255859375, -10.754150390625, -10.3857421875, -10.017333984375, -9.64892578125, -9.280517578125, -8.912109375, -8.543701171875, -8.17529296875, -7.806884765625, -7.4384765625, -7.070068359375, -6.70166015625, -6.333251953125, -5.96484375, -5.596435546875, -5.22802734375, -4.859619140625, -4.4912109375, -4.122802734375, -3.75439453125, -3.385986328125, -3.017578125, -2.649169921875, -2.28076171875, -1.912353515625, -1.5439453125, -1.175537109375, -0.80712890625, -0.438720703125, -0.0703125, 0.298095703125, 0.66650390625, 1.034912109375, 1.4033203125, 1.771728515625, 2.14013671875, 2.508544921875, 2.876953125, 3.245361328125, 3.61376953125, 3.982177734375, 4.3505859375, 4.718994140625, 5.08740234375, 5.455810546875, 5.82421875, 6.192626953125, 6.56103515625, 6.929443359375, 7.2978515625, 7.666259765625, 8.03466796875, 8.403076171875, 8.771484375, 9.139892578125, 9.50830078125, 9.876708984375, 10.2451171875, 10.613525390625, 10.98193359375, 11.350341796875, 11.71875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 8.0, 15.0, 21.0, 32.0, 29.0, 64.0, 85.0, 112.0, 159.0, 239.0, 303.0, 384.0, 504.0, 502.0, 413.0, 350.0, 241.0, 187.0, 132.0, 90.0, 56.0, 37.0, 28.0, 12.0, 15.0, 10.0, 4.0, 8.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.734375, -7.52655029296875, -7.3187255859375, -7.11090087890625, -6.903076171875, -6.69525146484375, -6.4874267578125, -6.27960205078125, -6.07177734375, -5.86395263671875, -5.6561279296875, -5.44830322265625, -5.240478515625, -5.03265380859375, -4.8248291015625, -4.61700439453125, -4.4091796875, -4.20135498046875, -3.9935302734375, -3.78570556640625, -3.577880859375, -3.37005615234375, -3.1622314453125, -2.95440673828125, -2.74658203125, -2.53875732421875, -2.3309326171875, -2.12310791015625, -1.915283203125, -1.70745849609375, -1.4996337890625, -1.29180908203125, -1.083984375, -0.87615966796875, -0.6683349609375, -0.46051025390625, -0.252685546875, -0.04486083984375, 0.1629638671875, 0.37078857421875, 0.57861328125, 0.78643798828125, 0.9942626953125, 1.20208740234375, 1.409912109375, 1.61773681640625, 1.8255615234375, 2.03338623046875, 2.2412109375, 2.44903564453125, 2.6568603515625, 2.86468505859375, 3.072509765625, 3.28033447265625, 3.4881591796875, 3.69598388671875, 3.90380859375, 4.11163330078125, 4.3194580078125, 4.52728271484375, 4.735107421875, 4.94293212890625, 5.1507568359375, 5.35858154296875, 5.56640625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 16.0, 14.0, 27.0, 22.0, 48.0, 63.0, 84.0, 120.0, 119.0, 258.0, 344.0, 598.0, 1553.0, 9364.0, 340108.0, 3670567.0, 161856.0, 6065.0, 1301.0, 557.0, 341.0, 242.0, 158.0, 130.0, 90.0, 53.0, 43.0, 38.0, 26.0, 12.0, 11.0, 13.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5859375, -14.0726318359375, -13.559326171875, -13.0460205078125, -12.53271484375, -12.0194091796875, -11.506103515625, -10.9927978515625, -10.4794921875, -9.9661865234375, -9.452880859375, -8.9395751953125, -8.42626953125, -7.9129638671875, -7.399658203125, -6.8863525390625, -6.373046875, -5.8597412109375, -5.346435546875, -4.8331298828125, -4.31982421875, -3.8065185546875, -3.293212890625, -2.7799072265625, -2.2666015625, -1.7532958984375, -1.239990234375, -0.7266845703125, -0.21337890625, 0.2999267578125, 0.813232421875, 1.3265380859375, 1.83984375, 2.3531494140625, 2.866455078125, 3.3797607421875, 3.89306640625, 4.4063720703125, 4.919677734375, 5.4329833984375, 5.9462890625, 6.4595947265625, 6.972900390625, 7.4862060546875, 7.99951171875, 8.5128173828125, 9.026123046875, 9.5394287109375, 10.052734375, 10.5660400390625, 11.079345703125, 11.5926513671875, 12.10595703125, 12.6192626953125, 13.132568359375, 13.6458740234375, 14.1591796875, 14.6724853515625, 15.185791015625, 15.6990966796875, 16.21240234375, 16.7257080078125, 17.239013671875, 17.7523193359375, 18.265625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 42.0, 150.0, 266.0, 317.0, 159.0, 50.0, 16.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.89935302734375, -65.1007080078125, -63.30207061767578, -61.5034294128418, -59.70478820800781, -57.90614700317383, -56.107505798339844, -54.30886459350586, -52.510223388671875, -50.71158218383789, -48.912940979003906, -47.11429977416992, -45.31565856933594, -43.51701736450195, -41.71837615966797, -39.919734954833984, -38.12109375, -36.322452545166016, -34.52381134033203, -32.72517013549805, -30.926528930664062, -29.127887725830078, -27.329246520996094, -25.53060531616211, -23.73196029663086, -21.933319091796875, -20.13467788696289, -18.336036682128906, -16.537395477294922, -14.738753318786621, -12.940112113952637, -11.141470909118652, -9.342830657958984, -7.544189453125, -5.745548248291016, -3.946906566619873, -2.1482653617858887, -0.3496236801147461, 1.4490175247192383, 3.2476587295532227, 5.046299934387207, 6.844941139221191, 8.643582344055176, 10.442224502563477, 12.240865707397461, 14.039506912231445, 15.83814811706543, 17.636789321899414, 19.4354305267334, 21.234071731567383, 23.032712936401367, 24.83135414123535, 26.629995346069336, 28.428638458251953, 30.227279663085938, 32.02592086791992, 33.824562072753906, 35.62320327758789, 37.421844482421875, 39.22048568725586, 41.019126892089844, 42.81776809692383, 44.61640930175781, 46.4150505065918, 48.21369171142578]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 7.0, 9.0, 14.0, 16.0, 19.0, 29.0, 20.0, 25.0, 20.0, 29.0, 42.0, 32.0, 37.0, 46.0, 41.0, 48.0, 40.0, 40.0, 38.0, 43.0, 39.0, 46.0, 36.0, 28.0, 36.0, 35.0, 33.0, 19.0, 11.0, 19.0, 14.0, 19.0, 14.0, 14.0, 9.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.433757781982422, -21.74953269958496, -21.065309524536133, -20.381084442138672, -19.696861267089844, -19.012636184692383, -18.328411102294922, -17.644187927246094, -16.959962844848633, -16.275737762451172, -15.591514587402344, -14.907289505004883, -14.223065376281738, -13.538841247558594, -12.854616165161133, -12.170392036437988, -11.486167907714844, -10.8019437789917, -10.117719650268555, -9.433494567871094, -8.74927043914795, -8.065046310424805, -7.380821704864502, -6.696597099304199, -6.012372970581055, -5.32814884185791, -4.643924236297607, -3.959699869155884, -3.27547550201416, -2.5912511348724365, -1.907026767730713, -1.2228021621704102, -0.5385780334472656, 0.145646333694458, 0.8298707008361816, 1.5140950679779053, 2.198319435119629, 2.8825438022613525, 3.566768169403076, 4.250992774963379, 4.935216903686523, 5.619441032409668, 6.303665637969971, 6.987890243530273, 7.672114372253418, 8.356338500976562, 9.040563583374023, 9.724787712097168, 10.409011840820312, 11.093235969543457, 11.777460098266602, 12.461685180664062, 13.145909309387207, 13.830133438110352, 14.514358520507812, 15.198582649230957, 15.882806777954102, 16.567031860351562, 17.25125503540039, 17.93548011779785, 18.619705200195312, 19.30392837524414, 19.9881534576416, 20.672378540039062, 21.35660171508789]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 16.0, 17.0, 21.0, 26.0, 19.0, 36.0, 24.0, 33.0, 27.0, 35.0, 40.0, 39.0, 41.0, 38.0, 45.0, 38.0, 53.0, 26.0, 40.0, 29.0, 31.0, 36.0, 36.0, 26.0, 30.0, 22.0, 24.0, 22.0, 13.0, 14.0, 14.0, 12.0, 6.0, 6.0, 6.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.86309814453125, -3.7379150390625, -3.61273193359375, -3.487548828125, -3.36236572265625, -3.2371826171875, -3.11199951171875, -2.98681640625, -2.86163330078125, -2.7364501953125, -2.61126708984375, -2.486083984375, -2.36090087890625, -2.2357177734375, -2.11053466796875, -1.9853515625, -1.86016845703125, -1.7349853515625, -1.60980224609375, -1.484619140625, -1.35943603515625, -1.2342529296875, -1.10906982421875, -0.98388671875, -0.85870361328125, -0.7335205078125, -0.60833740234375, -0.483154296875, -0.35797119140625, -0.2327880859375, -0.10760498046875, 0.017578125, 0.14276123046875, 0.2679443359375, 0.39312744140625, 0.518310546875, 0.64349365234375, 0.7686767578125, 0.89385986328125, 1.01904296875, 1.14422607421875, 1.2694091796875, 1.39459228515625, 1.519775390625, 1.64495849609375, 1.7701416015625, 1.89532470703125, 2.0205078125, 2.14569091796875, 2.2708740234375, 2.39605712890625, 2.521240234375, 2.64642333984375, 2.7716064453125, 2.89678955078125, 3.02197265625, 3.14715576171875, 3.2723388671875, 3.39752197265625, 3.522705078125, 3.64788818359375, 3.7730712890625, 3.89825439453125, 4.0234375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 5.0, 9.0, 22.0, 29.0, 39.0, 71.0, 104.0, 126.0, 232.0, 377.0, 617.0, 989.0, 1568.0, 2436.0, 4054.0, 6472.0, 10800.0, 17945.0, 29946.0, 52393.0, 97591.0, 236002.0, 314240.0, 122082.0, 61900.0, 35485.0, 20680.0, 12501.0, 7597.0, 4594.0, 2875.0, 1751.0, 1125.0, 680.0, 448.0, 261.0, 177.0, 119.0, 65.0, 42.0, 35.0, 19.0, 15.0, 14.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.84619140625, -0.8206634521484375, -0.795135498046875, -0.7696075439453125, -0.74407958984375, -0.7185516357421875, -0.693023681640625, -0.6674957275390625, -0.6419677734375, -0.6164398193359375, -0.590911865234375, -0.5653839111328125, -0.53985595703125, -0.5143280029296875, -0.488800048828125, -0.4632720947265625, -0.437744140625, -0.4122161865234375, -0.386688232421875, -0.3611602783203125, -0.33563232421875, -0.3101043701171875, -0.284576416015625, -0.2590484619140625, -0.2335205078125, -0.2079925537109375, -0.182464599609375, -0.1569366455078125, -0.13140869140625, -0.1058807373046875, -0.080352783203125, -0.0548248291015625, -0.029296875, -0.0037689208984375, 0.021759033203125, 0.0472869873046875, 0.07281494140625, 0.0983428955078125, 0.123870849609375, 0.1493988037109375, 0.1749267578125, 0.2004547119140625, 0.225982666015625, 0.2515106201171875, 0.27703857421875, 0.3025665283203125, 0.328094482421875, 0.3536224365234375, 0.379150390625, 0.4046783447265625, 0.430206298828125, 0.4557342529296875, 0.48126220703125, 0.5067901611328125, 0.532318115234375, 0.5578460693359375, 0.5833740234375, 0.6089019775390625, 0.634429931640625, 0.6599578857421875, 0.68548583984375, 0.7110137939453125, 0.736541748046875, 0.7620697021484375, 0.78759765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 9.0, 7.0, 15.0, 11.0, 9.0, 8.0, 13.0, 15.0, 29.0, 31.0, 14.0, 22.0, 29.0, 24.0, 34.0, 25.0, 28.0, 37.0, 38.0, 28.0, 38.0, 1050.0, 32.0, 39.0, 38.0, 37.0, 31.0, 31.0, 38.0, 26.0, 25.0, 20.0, 24.0, 19.0, 11.0, 23.0, 14.0, 13.0, 15.0, 10.0, 12.0, 10.0, 4.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.0703125, -2.00360107421875, -1.9368896484375, -1.87017822265625, -1.803466796875, -1.73675537109375, -1.6700439453125, -1.60333251953125, -1.53662109375, -1.46990966796875, -1.4031982421875, -1.33648681640625, -1.269775390625, -1.20306396484375, -1.1363525390625, -1.06964111328125, -1.0029296875, -0.93621826171875, -0.8695068359375, -0.80279541015625, -0.736083984375, -0.66937255859375, -0.6026611328125, -0.53594970703125, -0.46923828125, -0.40252685546875, -0.3358154296875, -0.26910400390625, -0.202392578125, -0.13568115234375, -0.0689697265625, -0.00225830078125, 0.064453125, 0.13116455078125, 0.1978759765625, 0.26458740234375, 0.331298828125, 0.39801025390625, 0.4647216796875, 0.53143310546875, 0.59814453125, 0.66485595703125, 0.7315673828125, 0.79827880859375, 0.864990234375, 0.93170166015625, 0.9984130859375, 1.06512451171875, 1.1318359375, 1.19854736328125, 1.2652587890625, 1.33197021484375, 1.398681640625, 1.46539306640625, 1.5321044921875, 1.59881591796875, 1.66552734375, 1.73223876953125, 1.7989501953125, 1.86566162109375, 1.932373046875, 1.99908447265625, 2.0657958984375, 2.13250732421875, 2.19921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 8.0, 11.0, 9.0, 18.0, 39.0, 53.0, 52.0, 103.0, 158.0, 253.0, 330.0, 469.0, 743.0, 1016.0, 1511.0, 2075.0, 3073.0, 4284.0, 6291.0, 9141.0, 13337.0, 19867.0, 30493.0, 47845.0, 78366.0, 142936.0, 1306025.0, 175759.0, 92696.0, 54916.0, 34461.0, 22846.0, 14815.0, 10109.0, 6943.0, 4952.0, 3418.0, 2405.0, 1604.0, 1220.0, 807.0, 516.0, 416.0, 243.0, 163.0, 120.0, 81.0, 53.0, 28.0, 23.0, 16.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.59814453125, -0.5792465209960938, -0.5603485107421875, -0.5414505004882812, -0.522552490234375, -0.5036544799804688, -0.4847564697265625, -0.46585845947265625, -0.44696044921875, -0.42806243896484375, -0.4091644287109375, -0.39026641845703125, -0.371368408203125, -0.35247039794921875, -0.3335723876953125, -0.31467437744140625, -0.2957763671875, -0.27687835693359375, -0.2579803466796875, -0.23908233642578125, -0.220184326171875, -0.20128631591796875, -0.1823883056640625, -0.16349029541015625, -0.14459228515625, -0.12569427490234375, -0.1067962646484375, -0.08789825439453125, -0.069000244140625, -0.05010223388671875, -0.0312042236328125, -0.01230621337890625, 0.006591796875, 0.02548980712890625, 0.0443878173828125, 0.06328582763671875, 0.082183837890625, 0.10108184814453125, 0.1199798583984375, 0.13887786865234375, 0.15777587890625, 0.17667388916015625, 0.1955718994140625, 0.21446990966796875, 0.233367919921875, 0.25226593017578125, 0.2711639404296875, 0.29006195068359375, 0.3089599609375, 0.32785797119140625, 0.3467559814453125, 0.36565399169921875, 0.384552001953125, 0.40345001220703125, 0.4223480224609375, 0.44124603271484375, 0.46014404296875, 0.47904205322265625, 0.4979400634765625, 0.5168380737304688, 0.535736083984375, 0.5546340942382812, 0.5735321044921875, 0.5924301147460938, 0.611328125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 11.0, 12.0, 11.0, 12.0, 10.0, 19.0, 26.0, 25.0, 33.0, 33.0, 37.0, 43.0, 43.0, 45.0, 34.0, 70.0, 40.0, 59.0, 44.0, 54.0, 47.0, 42.0, 41.0, 27.0, 36.0, 19.0, 23.0, 18.0, 9.0, 13.0, 15.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.0004208087921142578, -0.00040893256664276123, -0.00039705634117126465, -0.00038518011569976807, -0.0003733038902282715, -0.0003614276647567749, -0.0003495514392852783, -0.00033767521381378174, -0.00032579898834228516, -0.0003139227628707886, -0.000302046537399292, -0.0002901703119277954, -0.00027829408645629883, -0.00026641786098480225, -0.00025454163551330566, -0.00024266541004180908, -0.0002307891845703125, -0.00021891295909881592, -0.00020703673362731934, -0.00019516050815582275, -0.00018328428268432617, -0.0001714080572128296, -0.000159531831741333, -0.00014765560626983643, -0.00013577938079833984, -0.00012390315532684326, -0.00011202692985534668, -0.0001001507043838501, -8.827447891235352e-05, -7.639825344085693e-05, -6.452202796936035e-05, -5.264580249786377e-05, -4.076957702636719e-05, -2.8893351554870605e-05, -1.7017126083374023e-05, -5.140900611877441e-06, 6.735324859619141e-06, 1.8611550331115723e-05, 3.0487775802612305e-05, 4.236400127410889e-05, 5.424022674560547e-05, 6.611645221710205e-05, 7.799267768859863e-05, 8.986890316009521e-05, 0.0001017451286315918, 0.00011362135410308838, 0.00012549757957458496, 0.00013737380504608154, 0.00014925003051757812, 0.0001611262559890747, 0.0001730024814605713, 0.00018487870693206787, 0.00019675493240356445, 0.00020863115787506104, 0.00022050738334655762, 0.0002323836088180542, 0.0002442598342895508, 0.00025613605976104736, 0.00026801228523254395, 0.00027988851070404053, 0.0002917647361755371, 0.0003036409616470337, 0.0003155171871185303, 0.00032739341259002686, 0.00033926963806152344]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 7.0, 9.0, 11.0, 14.0, 15.0, 21.0, 30.0, 33.0, 42.0, 52.0, 76.0, 91.0, 108.0, 212.0, 310.0, 559.0, 1446.0, 627563.0, 415057.0, 1296.0, 577.0, 299.0, 162.0, 119.0, 96.0, 68.0, 52.0, 48.0, 28.0, 27.0, 21.0, 16.0, 16.0, 18.0, 9.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007129669189453125, -0.006883561611175537, -0.006637454032897949, -0.006391346454620361, -0.0061452388763427734, -0.0058991312980651855, -0.005653023719787598, -0.00540691614151001, -0.005160808563232422, -0.004914700984954834, -0.004668593406677246, -0.004422485828399658, -0.00417637825012207, -0.003930270671844482, -0.0036841630935668945, -0.0034380555152893066, -0.0031919479370117188, -0.002945840358734131, -0.002699732780456543, -0.002453625202178955, -0.002207517623901367, -0.0019614100456237793, -0.0017153024673461914, -0.0014691948890686035, -0.0012230873107910156, -0.0009769797325134277, -0.0007308721542358398, -0.00048476457595825195, -0.00023865699768066406, 7.450580596923828e-06, 0.0002535581588745117, 0.0004996657371520996, 0.0007457733154296875, 0.0009918808937072754, 0.0012379884719848633, 0.0014840960502624512, 0.001730203628540039, 0.001976311206817627, 0.002222418785095215, 0.0024685263633728027, 0.0027146339416503906, 0.0029607415199279785, 0.0032068490982055664, 0.0034529566764831543, 0.003699064254760742, 0.00394517183303833, 0.004191279411315918, 0.004437386989593506, 0.004683494567871094, 0.004929602146148682, 0.0051757097244262695, 0.005421817302703857, 0.005667924880981445, 0.005914032459259033, 0.006160140037536621, 0.006406247615814209, 0.006652355194091797, 0.006898462772369385, 0.007144570350646973, 0.0073906779289245605, 0.0076367855072021484, 0.007882893085479736, 0.008129000663757324, 0.008375108242034912, 0.0086212158203125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 57.0, 706.0, 243.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015413217479363084, -0.0014942148700356483, -0.0014471081085503101, -0.00140000123064965, -0.00135289435274899, -0.00130578747484833, -0.00125868059694767, -0.0012115738354623318, -0.0011644669575616717, -0.0011173600796610117, -0.0010702533181756735, -0.0010231464402750134, -0.0009760395623743534, -0.0009289326844736934, -0.0008818258647806942, -0.0008347190450876951, -0.0007876121671870351, -0.000740505289286375, -0.0006933984695933759, -0.0006462916499003768, -0.0005991847719997168, -0.0005520778940990567, -0.0005049710744060576, -0.000457864225609228, -0.00041075737681239843, -0.00036365052801556885, -0.00031654367921873927, -0.0002694368304219097, -0.0002223299816250801, -0.00017522313282825053, -0.00012811628403142095, -8.100943523459136e-05, -3.390270285308361e-05, 1.320414594374597e-05, 6.031099474057555e-05, 0.00010741784353740513, 0.00015452469233423471, 0.0002016315411310643, 0.0002487383899278939, 0.00029584523872472346, 0.00034295208752155304, 0.0003900589363183826, 0.0004371657851152122, 0.0004842726339120418, 0.0005313794827088714, 0.0005784863606095314, 0.0006255931803025305, 0.0006726999999955297, 0.0007198068778961897, 0.0007669137557968497, 0.0008140205754898489, 0.000861127395182848, 0.000908234273083508, 0.000955341150984168, 0.0010024479124695063, 0.0010495547903701663, 0.0010966616682708263, 0.0011437685461714864, 0.0011908754240721464, 0.0012379821855574846, 0.0012850890634581447, 0.0013321959413588047, 0.001379302702844143, 0.001426409580744803, 0.001473516458645463]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 23.0, 23.0, 23.0, 19.0, 35.0, 35.0, 43.0, 43.0, 32.0, 39.0, 42.0, 37.0, 50.0, 49.0, 28.0, 44.0, 42.0, 45.0, 37.0, 34.0, 36.0, 27.0, 27.0, 25.0, 18.0, 23.0, 17.0, 12.0, 9.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002117156982421875, -0.00020445510745048523, -0.00019719451665878296, -0.0001899339258670807, -0.00018267333507537842, -0.00017541274428367615, -0.00016815215349197388, -0.0001608915627002716, -0.00015363097190856934, -0.00014637038111686707, -0.0001391097903251648, -0.00013184919953346252, -0.00012458860874176025, -0.00011732801795005798, -0.00011006742715835571, -0.00010280683636665344, -9.554624557495117e-05, -8.82856547832489e-05, -8.102506399154663e-05, -7.376447319984436e-05, -6.650388240814209e-05, -5.924329161643982e-05, -5.198270082473755e-05, -4.472211003303528e-05, -3.746151924133301e-05, -3.0200928449630737e-05, -2.2940337657928467e-05, -1.5679746866226196e-05, -8.419156074523926e-06, -1.1585652828216553e-06, 6.102025508880615e-06, 1.3362616300582886e-05, 2.0623207092285156e-05, 2.7883797883987427e-05, 3.51443886756897e-05, 4.240497946739197e-05, 4.966557025909424e-05, 5.692616105079651e-05, 6.418675184249878e-05, 7.144734263420105e-05, 7.870793342590332e-05, 8.596852421760559e-05, 9.322911500930786e-05, 0.00010048970580101013, 0.0001077502965927124, 0.00011501088738441467, 0.00012227147817611694, 0.00012953206896781921, 0.00013679265975952148, 0.00014405325055122375, 0.00015131384134292603, 0.0001585744321346283, 0.00016583502292633057, 0.00017309561371803284, 0.0001803562045097351, 0.00018761679530143738, 0.00019487738609313965, 0.00020213797688484192, 0.0002093985676765442, 0.00021665915846824646, 0.00022391974925994873, 0.000231180340051651, 0.00023844093084335327, 0.00024570152163505554, 0.0002529621124267578]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 16.0, 17.0, 21.0, 26.0, 19.0, 36.0, 24.0, 33.0, 27.0, 35.0, 40.0, 39.0, 41.0, 38.0, 45.0, 38.0, 53.0, 26.0, 40.0, 29.0, 31.0, 36.0, 36.0, 26.0, 30.0, 22.0, 24.0, 22.0, 13.0, 14.0, 14.0, 12.0, 6.0, 6.0, 6.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.86309814453125, -3.7379150390625, -3.61273193359375, -3.487548828125, -3.36236572265625, -3.2371826171875, -3.11199951171875, -2.98681640625, -2.86163330078125, -2.7364501953125, -2.61126708984375, -2.486083984375, -2.36090087890625, -2.2357177734375, -2.11053466796875, -1.9853515625, -1.86016845703125, -1.7349853515625, -1.60980224609375, -1.484619140625, -1.35943603515625, -1.2342529296875, -1.10906982421875, -0.98388671875, -0.85870361328125, -0.7335205078125, -0.60833740234375, -0.483154296875, -0.35797119140625, -0.2327880859375, -0.10760498046875, 0.017578125, 0.14276123046875, 0.2679443359375, 0.39312744140625, 0.518310546875, 0.64349365234375, 0.7686767578125, 0.89385986328125, 1.01904296875, 1.14422607421875, 1.2694091796875, 1.39459228515625, 1.519775390625, 1.64495849609375, 1.7701416015625, 1.89532470703125, 2.0205078125, 2.14569091796875, 2.2708740234375, 2.39605712890625, 2.521240234375, 2.64642333984375, 2.7716064453125, 2.89678955078125, 3.02197265625, 3.14715576171875, 3.2723388671875, 3.39752197265625, 3.522705078125, 3.64788818359375, 3.7730712890625, 3.89825439453125, 4.0234375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 11.0, 9.0, 20.0, 24.0, 39.0, 44.0, 60.0, 91.0, 98.0, 151.0, 219.0, 269.0, 346.0, 485.0, 742.0, 1425.0, 4955.0, 28368.0, 311394.0, 638872.0, 48429.0, 7709.0, 1858.0, 820.0, 544.0, 404.0, 321.0, 221.0, 141.0, 113.0, 100.0, 65.0, 44.0, 37.0, 29.0, 25.0, 19.0, 9.0, 6.0, 2.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7418212890625, -9.428955078125, -9.1160888671875, -8.80322265625, -8.4903564453125, -8.177490234375, -7.8646240234375, -7.5517578125, -7.2388916015625, -6.926025390625, -6.6131591796875, -6.30029296875, -5.9874267578125, -5.674560546875, -5.3616943359375, -5.048828125, -4.7359619140625, -4.423095703125, -4.1102294921875, -3.79736328125, -3.4844970703125, -3.171630859375, -2.8587646484375, -2.5458984375, -2.2330322265625, -1.920166015625, -1.6072998046875, -1.29443359375, -0.9815673828125, -0.668701171875, -0.3558349609375, -0.04296875, 0.2698974609375, 0.582763671875, 0.8956298828125, 1.20849609375, 1.5213623046875, 1.834228515625, 2.1470947265625, 2.4599609375, 2.7728271484375, 3.085693359375, 3.3985595703125, 3.71142578125, 4.0242919921875, 4.337158203125, 4.6500244140625, 4.962890625, 5.2757568359375, 5.588623046875, 5.9014892578125, 6.21435546875, 6.5272216796875, 6.840087890625, 7.1529541015625, 7.4658203125, 7.7786865234375, 8.091552734375, 8.4044189453125, 8.71728515625, 9.0301513671875, 9.343017578125, 9.6558837890625, 9.96875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 11.0, 5.0, 16.0, 16.0, 18.0, 20.0, 32.0, 23.0, 39.0, 30.0, 34.0, 39.0, 59.0, 56.0, 86.0, 180.0, 1621.0, 274.0, 94.0, 74.0, 39.0, 45.0, 39.0, 43.0, 26.0, 27.0, 20.0, 14.0, 13.0, 17.0, 7.0, 11.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.0604248046875, -14.613037109375, -14.1656494140625, -13.71826171875, -13.2708740234375, -12.823486328125, -12.3760986328125, -11.9287109375, -11.4813232421875, -11.033935546875, -10.5865478515625, -10.13916015625, -9.6917724609375, -9.244384765625, -8.7969970703125, -8.349609375, -7.9022216796875, -7.454833984375, -7.0074462890625, -6.56005859375, -6.1126708984375, -5.665283203125, -5.2178955078125, -4.7705078125, -4.3231201171875, -3.875732421875, -3.4283447265625, -2.98095703125, -2.5335693359375, -2.086181640625, -1.6387939453125, -1.19140625, -0.7440185546875, -0.296630859375, 0.1507568359375, 0.59814453125, 1.0455322265625, 1.492919921875, 1.9403076171875, 2.3876953125, 2.8350830078125, 3.282470703125, 3.7298583984375, 4.17724609375, 4.6246337890625, 5.072021484375, 5.5194091796875, 5.966796875, 6.4141845703125, 6.861572265625, 7.3089599609375, 7.75634765625, 8.2037353515625, 8.651123046875, 9.0985107421875, 9.5458984375, 9.9932861328125, 10.440673828125, 10.8880615234375, 11.33544921875, 11.7828369140625, 12.230224609375, 12.6776123046875, 13.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 13.0, 15.0, 10.0, 21.0, 16.0, 21.0, 40.0, 53.0, 49.0, 75.0, 111.0, 193.0, 307.0, 769.0, 3352.0, 1588569.0, 1546780.0, 3514.0, 732.0, 324.0, 209.0, 125.0, 85.0, 58.0, 52.0, 40.0, 25.0, 32.0, 17.0, 10.0, 22.0, 12.0, 11.0, 9.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4375, -33.28955078125, -32.1416015625, -30.99365234375, -29.845703125, -28.69775390625, -27.5498046875, -26.40185546875, -25.25390625, -24.10595703125, -22.9580078125, -21.81005859375, -20.662109375, -19.51416015625, -18.3662109375, -17.21826171875, -16.0703125, -14.92236328125, -13.7744140625, -12.62646484375, -11.478515625, -10.33056640625, -9.1826171875, -8.03466796875, -6.88671875, -5.73876953125, -4.5908203125, -3.44287109375, -2.294921875, -1.14697265625, 0.0009765625, 1.14892578125, 2.296875, 3.44482421875, 4.5927734375, 5.74072265625, 6.888671875, 8.03662109375, 9.1845703125, 10.33251953125, 11.48046875, 12.62841796875, 13.7763671875, 14.92431640625, 16.072265625, 17.22021484375, 18.3681640625, 19.51611328125, 20.6640625, 21.81201171875, 22.9599609375, 24.10791015625, 25.255859375, 26.40380859375, 27.5517578125, 28.69970703125, 29.84765625, 30.99560546875, 32.1435546875, 33.29150390625, 34.439453125, 35.58740234375, 36.7353515625, 37.88330078125, 39.03125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 46.0, 157.0, 291.0, 281.0, 162.0, 50.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.175193786621094, -38.2205810546875, -37.26596450805664, -36.31134796142578, -35.35673522949219, -34.402122497558594, -33.447505950927734, -32.492889404296875, -31.53827667236328, -30.583662033081055, -29.629047393798828, -28.6744327545166, -27.719818115234375, -26.76520347595215, -25.810588836669922, -24.855974197387695, -23.90135955810547, -22.946744918823242, -21.992130279541016, -21.03751564025879, -20.082901000976562, -19.128286361694336, -18.17367172241211, -17.219057083129883, -16.264442443847656, -15.30982780456543, -14.355213165283203, -13.400598526000977, -12.44598388671875, -11.491369247436523, -10.536754608154297, -9.58213996887207, -8.627527236938477, -7.67291259765625, -6.718297958374023, -5.763683319091797, -4.80906867980957, -3.8544540405273438, -2.899839401245117, -1.9452247619628906, -0.9906101226806641, -0.0359954833984375, 0.9186191558837891, 1.8732337951660156, 2.827848434448242, 3.7824630737304688, 4.737077713012695, 5.691692352294922, 6.646306991577148, 7.600921630859375, 8.555536270141602, 9.510150909423828, 10.464765548706055, 11.419380187988281, 12.373994827270508, 13.328609466552734, 14.283224105834961, 15.237838745117188, 16.192453384399414, 17.14706802368164, 18.101682662963867, 19.056297302246094, 20.01091194152832, 20.965526580810547, 21.920141220092773]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 7.0, 4.0, 6.0, 8.0, 15.0, 11.0, 13.0, 14.0, 12.0, 26.0, 15.0, 19.0, 29.0, 26.0, 34.0, 29.0, 38.0, 37.0, 45.0, 34.0, 47.0, 32.0, 40.0, 48.0, 39.0, 34.0, 36.0, 33.0, 35.0, 23.0, 37.0, 17.0, 24.0, 24.0, 14.0, 17.0, 13.0, 15.0, 19.0, 3.0, 4.0, 3.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.897613525390625, -25.985258102416992, -25.07290267944336, -24.16054916381836, -23.248193740844727, -22.335838317871094, -21.42348289489746, -20.511127471923828, -19.598772048950195, -18.686416625976562, -17.77406120300293, -16.861705780029297, -15.94935131072998, -15.036996841430664, -14.124641418457031, -13.212285995483398, -12.299931526184082, -11.38757610321045, -10.475221633911133, -9.5628662109375, -8.650510787963867, -7.738155841827393, -6.825800895690918, -5.913445472717285, -5.0010905265808105, -4.088735580444336, -3.176380157470703, -2.2640252113342285, -1.3516700267791748, -0.4393148422241211, 0.4730401039123535, 1.3853955268859863, 2.297750473022461, 3.2101056575775146, 4.122460842132568, 5.034815788269043, 5.947171211242676, 6.85952615737915, 7.771881103515625, 8.684236526489258, 9.59659194946289, 10.508947372436523, 11.42130184173584, 12.333657264709473, 13.246012687683105, 14.158367156982422, 15.070722579956055, 15.983078002929688, 16.895431518554688, 17.80778694152832, 18.720142364501953, 19.632495880126953, 20.544851303100586, 21.45720672607422, 22.36956214904785, 23.281917572021484, 24.194272994995117, 25.10662841796875, 26.018983840942383, 26.931339263916016, 27.843692779541016, 28.75604820251465, 29.66840362548828, 30.580759048461914, 31.493114471435547]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 10.0, 8.0, 10.0, 11.0, 6.0, 8.0, 26.0, 13.0, 17.0, 24.0, 28.0, 37.0, 31.0, 33.0, 35.0, 40.0, 36.0, 46.0, 43.0, 47.0, 44.0, 48.0, 43.0, 32.0, 40.0, 26.0, 27.0, 35.0, 26.0, 25.0, 29.0, 19.0, 14.0, 17.0, 8.0, 15.0, 12.0, 10.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -3.9979248046875, -3.863037109375, -3.7281494140625, -3.59326171875, -3.4583740234375, -3.323486328125, -3.1885986328125, -3.0537109375, -2.9188232421875, -2.783935546875, -2.6490478515625, -2.51416015625, -2.3792724609375, -2.244384765625, -2.1094970703125, -1.974609375, -1.8397216796875, -1.704833984375, -1.5699462890625, -1.43505859375, -1.3001708984375, -1.165283203125, -1.0303955078125, -0.8955078125, -0.7606201171875, -0.625732421875, -0.4908447265625, -0.35595703125, -0.2210693359375, -0.086181640625, 0.0487060546875, 0.18359375, 0.3184814453125, 0.453369140625, 0.5882568359375, 0.72314453125, 0.8580322265625, 0.992919921875, 1.1278076171875, 1.2626953125, 1.3975830078125, 1.532470703125, 1.6673583984375, 1.80224609375, 1.9371337890625, 2.072021484375, 2.2069091796875, 2.341796875, 2.4766845703125, 2.611572265625, 2.7464599609375, 2.88134765625, 3.0162353515625, 3.151123046875, 3.2860107421875, 3.4208984375, 3.5557861328125, 3.690673828125, 3.8255615234375, 3.96044921875, 4.0953369140625, 4.230224609375, 4.3651123046875, 4.5]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 12.0, 14.0, 23.0, 29.0, 28.0, 35.0, 56.0, 68.0, 87.0, 104.0, 166.0, 212.0, 311.0, 498.0, 1098.0, 5178.0, 79619.0, 1155950.0, 2472550.0, 449604.0, 23942.0, 2449.0, 768.0, 430.0, 261.0, 186.0, 143.0, 86.0, 78.0, 58.0, 62.0, 29.0, 32.0, 24.0, 20.0, 15.0, 9.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.171875, -7.9107666015625, -7.649658203125, -7.3885498046875, -7.12744140625, -6.8663330078125, -6.605224609375, -6.3441162109375, -6.0830078125, -5.8218994140625, -5.560791015625, -5.2996826171875, -5.03857421875, -4.7774658203125, -4.516357421875, -4.2552490234375, -3.994140625, -3.7330322265625, -3.471923828125, -3.2108154296875, -2.94970703125, -2.6885986328125, -2.427490234375, -2.1663818359375, -1.9052734375, -1.6441650390625, -1.383056640625, -1.1219482421875, -0.86083984375, -0.5997314453125, -0.338623046875, -0.0775146484375, 0.18359375, 0.4447021484375, 0.705810546875, 0.9669189453125, 1.22802734375, 1.4891357421875, 1.750244140625, 2.0113525390625, 2.2724609375, 2.5335693359375, 2.794677734375, 3.0557861328125, 3.31689453125, 3.5780029296875, 3.839111328125, 4.1002197265625, 4.361328125, 4.6224365234375, 4.883544921875, 5.1446533203125, 5.40576171875, 5.6668701171875, 5.927978515625, 6.1890869140625, 6.4501953125, 6.7113037109375, 6.972412109375, 7.2335205078125, 7.49462890625, 7.7557373046875, 8.016845703125, 8.2779541015625, 8.5390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 7.0, 5.0, 6.0, 12.0, 12.0, 30.0, 35.0, 47.0, 57.0, 80.0, 111.0, 148.0, 217.0, 273.0, 351.0, 418.0, 436.0, 387.0, 399.0, 281.0, 202.0, 153.0, 106.0, 75.0, 45.0, 48.0, 31.0, 26.0, 22.0, 10.0, 7.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.1016845703125, -5.914306640625, -5.7269287109375, -5.53955078125, -5.3521728515625, -5.164794921875, -4.9774169921875, -4.7900390625, -4.6026611328125, -4.415283203125, -4.2279052734375, -4.04052734375, -3.8531494140625, -3.665771484375, -3.4783935546875, -3.291015625, -3.1036376953125, -2.916259765625, -2.7288818359375, -2.54150390625, -2.3541259765625, -2.166748046875, -1.9793701171875, -1.7919921875, -1.6046142578125, -1.417236328125, -1.2298583984375, -1.04248046875, -0.8551025390625, -0.667724609375, -0.4803466796875, -0.29296875, -0.1055908203125, 0.081787109375, 0.2691650390625, 0.45654296875, 0.6439208984375, 0.831298828125, 1.0186767578125, 1.2060546875, 1.3934326171875, 1.580810546875, 1.7681884765625, 1.95556640625, 2.1429443359375, 2.330322265625, 2.5177001953125, 2.705078125, 2.8924560546875, 3.079833984375, 3.2672119140625, 3.45458984375, 3.6419677734375, 3.829345703125, 4.0167236328125, 4.2041015625, 4.3914794921875, 4.578857421875, 4.7662353515625, 4.95361328125, 5.1409912109375, 5.328369140625, 5.5157470703125, 5.703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 7.0, 7.0, 11.0, 15.0, 20.0, 36.0, 44.0, 64.0, 84.0, 109.0, 175.0, 284.0, 469.0, 784.0, 1983.0, 9690.0, 201338.0, 3544626.0, 414776.0, 14974.0, 2391.0, 880.0, 474.0, 325.0, 190.0, 141.0, 95.0, 83.0, 45.0, 33.0, 30.0, 29.0, 12.0, 10.0, 7.0, 11.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.8046875, -14.3360595703125, -13.867431640625, -13.3988037109375, -12.93017578125, -12.4615478515625, -11.992919921875, -11.5242919921875, -11.0556640625, -10.5870361328125, -10.118408203125, -9.6497802734375, -9.18115234375, -8.7125244140625, -8.243896484375, -7.7752685546875, -7.306640625, -6.8380126953125, -6.369384765625, -5.9007568359375, -5.43212890625, -4.9635009765625, -4.494873046875, -4.0262451171875, -3.5576171875, -3.0889892578125, -2.620361328125, -2.1517333984375, -1.68310546875, -1.2144775390625, -0.745849609375, -0.2772216796875, 0.19140625, 0.6600341796875, 1.128662109375, 1.5972900390625, 2.06591796875, 2.5345458984375, 3.003173828125, 3.4718017578125, 3.9404296875, 4.4090576171875, 4.877685546875, 5.3463134765625, 5.81494140625, 6.2835693359375, 6.752197265625, 7.2208251953125, 7.689453125, 8.1580810546875, 8.626708984375, 9.0953369140625, 9.56396484375, 10.0325927734375, 10.501220703125, 10.9698486328125, 11.4384765625, 11.9071044921875, 12.375732421875, 12.8443603515625, 13.31298828125, 13.7816162109375, 14.250244140625, 14.7188720703125, 15.1875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 298.0, 716.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-725.9168701171875, -710.8220825195312, -695.727294921875, -680.6325073242188, -665.5377197265625, -650.4429321289062, -635.34814453125, -620.2533569335938, -605.1585693359375, -590.0637817382812, -574.968994140625, -559.8742065429688, -544.7794189453125, -529.6846313476562, -514.58984375, -499.49505615234375, -484.4002380371094, -469.3054504394531, -454.2106628417969, -439.1158752441406, -424.0210876464844, -408.9263000488281, -393.83148193359375, -378.7366943359375, -363.64190673828125, -348.547119140625, -333.45233154296875, -318.3575439453125, -303.26275634765625, -288.16796875, -273.07318115234375, -257.9783935546875, -242.88357543945312, -227.78878784179688, -212.69400024414062, -197.59921264648438, -182.50442504882812, -167.40963745117188, -152.31483459472656, -137.2200469970703, -122.12525939941406, -107.03047180175781, -91.93568420410156, -76.84088897705078, -61.74610137939453, -46.65131378173828, -31.5565185546875, -16.46173095703125, -1.366943359375, 13.727846145629883, 28.822635650634766, 43.91742706298828, 59.01221466064453, 74.10700225830078, 89.20179748535156, 104.29658508300781, 119.39137268066406, 134.4861602783203, 149.58094787597656, 164.67575073242188, 179.77053833007812, 194.86532592773438, 209.96011352539062, 225.05490112304688, 240.14968872070312]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 17.0, 11.0, 18.0, 26.0, 29.0, 23.0, 42.0, 37.0, 36.0, 48.0, 56.0, 65.0, 68.0, 62.0, 46.0, 55.0, 56.0, 49.0, 46.0, 34.0, 36.0, 34.0, 26.0, 21.0, 16.0, 13.0, 7.0, 12.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.70359992980957, -19.747283935546875, -18.790969848632812, -17.834653854370117, -16.878337860107422, -15.922021865844727, -14.965706825256348, -14.009391784667969, -13.053075790405273, -12.096759796142578, -11.1404447555542, -10.18412971496582, -9.227813720703125, -8.27149772644043, -7.315182685852051, -6.358867168426514, -5.402551651000977, -4.4462361335754395, -3.4899206161499023, -2.5336050987243652, -1.5772895812988281, -0.620974063873291, 0.3353414535522461, 1.2916569709777832, 2.2479724884033203, 3.2042880058288574, 4.1606035232543945, 5.116919040679932, 6.073234558105469, 7.029550075531006, 7.985865592956543, 8.942180633544922, 9.89849853515625, 10.854814529418945, 11.811129570007324, 12.767444610595703, 13.723760604858398, 14.680076599121094, 15.636391639709473, 16.59270668029785, 17.549022674560547, 18.505338668823242, 19.461654663085938, 20.41796875, 21.374284744262695, 22.33060073852539, 23.286914825439453, 24.24323081970215, 25.199546813964844, 26.15586280822754, 27.112178802490234, 28.068492889404297, 29.024808883666992, 29.981124877929688, 30.93743896484375, 31.893754959106445, 32.85007095336914, 33.8063850402832, 34.76270294189453, 35.719017028808594, 36.675331115722656, 37.631649017333984, 38.58796310424805, 39.544281005859375, 40.50059509277344]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 8.0, 13.0, 13.0, 14.0, 12.0, 17.0, 20.0, 18.0, 20.0, 29.0, 34.0, 47.0, 35.0, 31.0, 39.0, 36.0, 46.0, 40.0, 38.0, 50.0, 54.0, 42.0, 37.0, 30.0, 44.0, 35.0, 23.0, 29.0, 23.0, 21.0, 15.0, 15.0, 14.0, 13.0, 10.0, 6.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.8138427734375, -3.678466796875, -3.5430908203125, -3.40771484375, -3.2723388671875, -3.136962890625, -3.0015869140625, -2.8662109375, -2.7308349609375, -2.595458984375, -2.4600830078125, -2.32470703125, -2.1893310546875, -2.053955078125, -1.9185791015625, -1.783203125, -1.6478271484375, -1.512451171875, -1.3770751953125, -1.24169921875, -1.1063232421875, -0.970947265625, -0.8355712890625, -0.7001953125, -0.5648193359375, -0.429443359375, -0.2940673828125, -0.15869140625, -0.0233154296875, 0.112060546875, 0.2474365234375, 0.3828125, 0.5181884765625, 0.653564453125, 0.7889404296875, 0.92431640625, 1.0596923828125, 1.195068359375, 1.3304443359375, 1.4658203125, 1.6011962890625, 1.736572265625, 1.8719482421875, 2.00732421875, 2.1427001953125, 2.278076171875, 2.4134521484375, 2.548828125, 2.6842041015625, 2.819580078125, 2.9549560546875, 3.09033203125, 3.2257080078125, 3.361083984375, 3.4964599609375, 3.6318359375, 3.7672119140625, 3.902587890625, 4.0379638671875, 4.17333984375, 4.3087158203125, 4.444091796875, 4.5794677734375, 4.71484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 12.0, 8.0, 18.0, 26.0, 35.0, 57.0, 79.0, 114.0, 187.0, 290.0, 414.0, 590.0, 915.0, 1372.0, 2047.0, 3087.0, 4781.0, 7158.0, 11249.0, 17985.0, 29475.0, 49940.0, 89441.0, 179743.0, 298882.0, 154125.0, 79053.0, 44694.0, 26497.0, 16564.0, 10206.0, 6581.0, 4342.0, 2820.0, 1944.0, 1249.0, 832.0, 593.0, 375.0, 227.0, 180.0, 120.0, 75.0, 49.0, 39.0, 29.0, 19.0, 11.0, 9.0, 7.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.82958984375, -0.8054733276367188, -0.7813568115234375, -0.7572402954101562, -0.733123779296875, -0.7090072631835938, -0.6848907470703125, -0.6607742309570312, -0.63665771484375, -0.6125411987304688, -0.5884246826171875, -0.5643081665039062, -0.540191650390625, -0.5160751342773438, -0.4919586181640625, -0.46784210205078125, -0.4437255859375, -0.41960906982421875, -0.3954925537109375, -0.37137603759765625, -0.347259521484375, -0.32314300537109375, -0.2990264892578125, -0.27490997314453125, -0.25079345703125, -0.22667694091796875, -0.2025604248046875, -0.17844390869140625, -0.154327392578125, -0.13021087646484375, -0.1060943603515625, -0.08197784423828125, -0.057861328125, -0.03374481201171875, -0.0096282958984375, 0.01448822021484375, 0.038604736328125, 0.06272125244140625, 0.0868377685546875, 0.11095428466796875, 0.13507080078125, 0.15918731689453125, 0.1833038330078125, 0.20742034912109375, 0.231536865234375, 0.25565338134765625, 0.2797698974609375, 0.30388641357421875, 0.3280029296875, 0.35211944580078125, 0.3762359619140625, 0.40035247802734375, 0.424468994140625, 0.44858551025390625, 0.4727020263671875, 0.49681854248046875, 0.52093505859375, 0.5450515747070312, 0.5691680908203125, 0.5932846069335938, 0.617401123046875, 0.6415176391601562, 0.6656341552734375, 0.6897506713867188, 0.7138671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 6.0, 4.0, 13.0, 12.0, 14.0, 14.0, 6.0, 19.0, 14.0, 18.0, 32.0, 31.0, 28.0, 29.0, 44.0, 41.0, 28.0, 35.0, 41.0, 36.0, 1060.0, 51.0, 43.0, 38.0, 36.0, 34.0, 35.0, 37.0, 25.0, 32.0, 22.0, 14.0, 13.0, 15.0, 13.0, 13.0, 11.0, 17.0, 7.0, 7.0, 8.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.455078125, -2.374176025390625, -2.29327392578125, -2.212371826171875, -2.1314697265625, -2.050567626953125, -1.96966552734375, -1.888763427734375, -1.807861328125, -1.726959228515625, -1.64605712890625, -1.565155029296875, -1.4842529296875, -1.403350830078125, -1.32244873046875, -1.241546630859375, -1.16064453125, -1.079742431640625, -0.99884033203125, -0.917938232421875, -0.8370361328125, -0.756134033203125, -0.67523193359375, -0.594329833984375, -0.513427734375, -0.432525634765625, -0.35162353515625, -0.270721435546875, -0.1898193359375, -0.108917236328125, -0.02801513671875, 0.052886962890625, 0.1337890625, 0.214691162109375, 0.29559326171875, 0.376495361328125, 0.4573974609375, 0.538299560546875, 0.61920166015625, 0.700103759765625, 0.781005859375, 0.861907958984375, 0.94281005859375, 1.023712158203125, 1.1046142578125, 1.185516357421875, 1.26641845703125, 1.347320556640625, 1.42822265625, 1.509124755859375, 1.59002685546875, 1.670928955078125, 1.7518310546875, 1.832733154296875, 1.91363525390625, 1.994537353515625, 2.075439453125, 2.156341552734375, 2.23724365234375, 2.318145751953125, 2.3990478515625, 2.479949951171875, 2.56085205078125, 2.641754150390625, 2.72265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 8.0, 6.0, 13.0, 16.0, 32.0, 45.0, 56.0, 91.0, 125.0, 195.0, 281.0, 416.0, 547.0, 822.0, 1167.0, 1771.0, 2484.0, 3607.0, 5179.0, 7815.0, 11739.0, 18111.0, 28713.0, 47456.0, 83202.0, 159637.0, 1352769.0, 158230.0, 82793.0, 46882.0, 28580.0, 18002.0, 11600.0, 7689.0, 5158.0, 3730.0, 2492.0, 1848.0, 1242.0, 805.0, 566.0, 424.0, 255.0, 196.0, 119.0, 69.0, 54.0, 48.0, 18.0, 11.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68701171875, -0.6644821166992188, -0.6419525146484375, -0.6194229125976562, -0.596893310546875, -0.5743637084960938, -0.5518341064453125, -0.5293045043945312, -0.50677490234375, -0.48424530029296875, -0.4617156982421875, -0.43918609619140625, -0.416656494140625, -0.39412689208984375, -0.3715972900390625, -0.34906768798828125, -0.3265380859375, -0.30400848388671875, -0.2814788818359375, -0.25894927978515625, -0.236419677734375, -0.21389007568359375, -0.1913604736328125, -0.16883087158203125, -0.14630126953125, -0.12377166748046875, -0.1012420654296875, -0.07871246337890625, -0.056182861328125, -0.03365325927734375, -0.0111236572265625, 0.01140594482421875, 0.033935546875, 0.05646514892578125, 0.0789947509765625, 0.10152435302734375, 0.124053955078125, 0.14658355712890625, 0.1691131591796875, 0.19164276123046875, 0.21417236328125, 0.23670196533203125, 0.2592315673828125, 0.28176116943359375, 0.304290771484375, 0.32682037353515625, 0.3493499755859375, 0.37187957763671875, 0.3944091796875, 0.41693878173828125, 0.4394683837890625, 0.46199798583984375, 0.484527587890625, 0.5070571899414062, 0.5295867919921875, 0.5521163940429688, 0.57464599609375, 0.5971755981445312, 0.6197052001953125, 0.6422348022460938, 0.664764404296875, 0.6872940063476562, 0.7098236083984375, 0.7323532104492188, 0.7548828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 12.0, 10.0, 9.0, 10.0, 12.0, 15.0, 18.0, 16.0, 31.0, 22.0, 32.0, 29.0, 33.0, 46.0, 44.0, 52.0, 48.0, 52.0, 54.0, 52.0, 39.0, 49.0, 38.0, 35.0, 35.0, 35.0, 18.0, 26.0, 25.0, 11.0, 17.0, 7.0, 17.0, 4.0, 6.0, 9.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00043773651123046875, -0.0004251226782798767, -0.00041250884532928467, -0.0003998950123786926, -0.0003872811794281006, -0.00037466734647750854, -0.0003620535135269165, -0.00034943968057632446, -0.0003368258476257324, -0.0003242120146751404, -0.00031159818172454834, -0.0002989843487739563, -0.00028637051582336426, -0.0002737566828727722, -0.0002611428499221802, -0.00024852901697158813, -0.0002359151840209961, -0.00022330135107040405, -0.000210687518119812, -0.00019807368516921997, -0.00018545985221862793, -0.0001728460192680359, -0.00016023218631744385, -0.0001476183533668518, -0.00013500452041625977, -0.00012239068746566772, -0.00010977685451507568, -9.716302156448364e-05, -8.45491886138916e-05, -7.193535566329956e-05, -5.932152271270752e-05, -4.670768976211548e-05, -3.409385681152344e-05, -2.1480023860931396e-05, -8.866190910339355e-06, 3.7476420402526855e-06, 1.6361474990844727e-05, 2.8975307941436768e-05, 4.158914089202881e-05, 5.420297384262085e-05, 6.681680679321289e-05, 7.943063974380493e-05, 9.204447269439697e-05, 0.00010465830564498901, 0.00011727213859558105, 0.0001298859715461731, 0.00014249980449676514, 0.00015511363744735718, 0.00016772747039794922, 0.00018034130334854126, 0.0001929551362991333, 0.00020556896924972534, 0.00021818280220031738, 0.00023079663515090942, 0.00024341046810150146, 0.0002560243010520935, 0.00026863813400268555, 0.0002812519669532776, 0.00029386579990386963, 0.00030647963285446167, 0.0003190934658050537, 0.00033170729875564575, 0.0003443211317062378, 0.00035693496465682983, 0.0003695487976074219]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 12.0, 14.0, 8.0, 8.0, 23.0, 23.0, 27.0, 27.0, 36.0, 39.0, 55.0, 73.0, 84.0, 131.0, 179.0, 228.0, 418.0, 700.0, 2545.0, 970600.0, 70479.0, 1149.0, 527.0, 342.0, 193.0, 138.0, 94.0, 71.0, 60.0, 48.0, 36.0, 40.0, 25.0, 29.0, 17.0, 21.0, 9.0, 4.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.007114410400390625, -0.006867110729217529, -0.006619811058044434, -0.006372511386871338, -0.006125211715698242, -0.0058779120445251465, -0.005630612373352051, -0.005383312702178955, -0.005136013031005859, -0.004888713359832764, -0.004641413688659668, -0.004394114017486572, -0.0041468143463134766, -0.003899514675140381, -0.003652215003967285, -0.0034049153327941895, -0.0031576156616210938, -0.002910315990447998, -0.0026630163192749023, -0.0024157166481018066, -0.002168416976928711, -0.0019211173057556152, -0.0016738176345825195, -0.0014265179634094238, -0.0011792182922363281, -0.0009319186210632324, -0.0006846189498901367, -0.000437319278717041, -0.0001900196075439453, 5.728006362915039e-05, 0.0003045797348022461, 0.0005518794059753418, 0.0007991790771484375, 0.0010464787483215332, 0.001293778419494629, 0.0015410780906677246, 0.0017883777618408203, 0.002035677433013916, 0.0022829771041870117, 0.0025302767753601074, 0.002777576446533203, 0.003024876117706299, 0.0032721757888793945, 0.0035194754600524902, 0.003766775131225586, 0.004014074802398682, 0.004261374473571777, 0.004508674144744873, 0.004755973815917969, 0.0050032734870910645, 0.00525057315826416, 0.005497872829437256, 0.0057451725006103516, 0.005992472171783447, 0.006239771842956543, 0.006487071514129639, 0.006734371185302734, 0.00698167085647583, 0.007228970527648926, 0.0074762701988220215, 0.007723569869995117, 0.007970869541168213, 0.008218169212341309, 0.008465468883514404, 0.0087127685546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 31.0, 435.0, 511.0, 37.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.002659361809492111, -0.002613550052046776, -0.002567738527432084, -0.0025219267699867487, -0.002476115245372057, -0.0024303034879267216, -0.00238449196331203, -0.0023386802058666945, -0.0022928686812520027, -0.0022470569238066673, -0.0022012453991919756, -0.00215543364174664, -0.0021096221171319485, -0.002063810359686613, -0.0020179988350719213, -0.001972187077626586, -0.0019263753201812506, -0.001880563679151237, -0.0018347520381212234, -0.0017889403970912099, -0.0017431287560611963, -0.001697316998615861, -0.0016515054740011692, -0.0016056937165558338, -0.001559882191941142, -0.0015140705509111285, -0.001468258909881115, -0.0014224472688511014, -0.0013766356278210878, -0.0013308238703757524, -0.0012850123457610607, -0.0012392005883157253, -0.00119338883087039, -0.0011475771898403764, -0.0011017655488103628, -0.0010559539077803493, -0.0010101422667503357, -0.0009643305675126612, -0.0009185189264826477, -0.0008727072272449732, -0.0008268957026302814, -0.0007810840616002679, -0.0007352724205702543, -0.0006894607795402408, -0.0006436490803025663, -0.0005978374392725527, -0.0005520257982425392, -0.0005062140990048647, -0.00046040245797485113, -0.00041459081694483757, -0.00036877914681099355, -0.00032296750578098, -0.000277155835647136, -0.0002313441946171224, -0.00018553255358710885, -0.00013972088345326483, -9.390924242325127e-05, -4.809759047930129e-05, -2.285938535351306e-06, 4.352570977061987e-05, 8.933736535254866e-05, 0.00013514902093447745, 0.000180960661964491, 0.00022677233209833503, 0.0002725839731283486]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 11.0, 7.0, 5.0, 17.0, 22.0, 16.0, 25.0, 16.0, 23.0, 24.0, 37.0, 33.0, 33.0, 41.0, 61.0, 36.0, 37.0, 51.0, 38.0, 50.0, 54.0, 48.0, 34.0, 32.0, 28.0, 35.0, 31.0, 23.0, 15.0, 22.0, 15.0, 14.0, 9.0, 7.0, 7.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022673606872558594, -0.00021886080503463745, -0.00021098554134368896, -0.00020311027765274048, -0.000195235013961792, -0.0001873597502708435, -0.00017948448657989502, -0.00017160922288894653, -0.00016373395919799805, -0.00015585869550704956, -0.00014798343181610107, -0.0001401081681251526, -0.0001322329044342041, -0.00012435764074325562, -0.00011648237705230713, -0.00010860711336135864, -0.00010073184967041016, -9.285658597946167e-05, -8.498132228851318e-05, -7.71060585975647e-05, -6.923079490661621e-05, -6.135553121566772e-05, -5.348026752471924e-05, -4.560500383377075e-05, -3.7729740142822266e-05, -2.985447645187378e-05, -2.1979212760925293e-05, -1.4103949069976807e-05, -6.22868537902832e-06, 1.646578311920166e-06, 9.521842002868652e-06, 1.739710569381714e-05, 2.5272369384765625e-05, 3.314763307571411e-05, 4.10228967666626e-05, 4.8898160457611084e-05, 5.677342414855957e-05, 6.464868783950806e-05, 7.252395153045654e-05, 8.039921522140503e-05, 8.827447891235352e-05, 9.6149742603302e-05, 0.00010402500629425049, 0.00011190026998519897, 0.00011977553367614746, 0.00012765079736709595, 0.00013552606105804443, 0.00014340132474899292, 0.0001512765884399414, 0.0001591518521308899, 0.00016702711582183838, 0.00017490237951278687, 0.00018277764320373535, 0.00019065290689468384, 0.00019852817058563232, 0.0002064034342765808, 0.0002142786979675293, 0.00022215396165847778, 0.00023002922534942627, 0.00023790448904037476, 0.00024577975273132324, 0.00025365501642227173, 0.0002615302801132202, 0.0002694055438041687, 0.0002772808074951172]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 8.0, 13.0, 13.0, 14.0, 12.0, 17.0, 20.0, 18.0, 20.0, 29.0, 34.0, 47.0, 35.0, 31.0, 39.0, 36.0, 46.0, 40.0, 38.0, 50.0, 54.0, 42.0, 37.0, 30.0, 43.0, 36.0, 23.0, 29.0, 23.0, 21.0, 15.0, 15.0, 14.0, 13.0, 10.0, 6.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.8138427734375, -3.678466796875, -3.5430908203125, -3.40771484375, -3.2723388671875, -3.136962890625, -3.0015869140625, -2.8662109375, -2.7308349609375, -2.595458984375, -2.4600830078125, -2.32470703125, -2.1893310546875, -2.053955078125, -1.9185791015625, -1.783203125, -1.6478271484375, -1.512451171875, -1.3770751953125, -1.24169921875, -1.1063232421875, -0.970947265625, -0.8355712890625, -0.7001953125, -0.5648193359375, -0.429443359375, -0.2940673828125, -0.15869140625, -0.0233154296875, 0.112060546875, 0.2474365234375, 0.3828125, 0.5181884765625, 0.653564453125, 0.7889404296875, 0.92431640625, 1.0596923828125, 1.195068359375, 1.3304443359375, 1.4658203125, 1.6011962890625, 1.736572265625, 1.8719482421875, 2.00732421875, 2.1427001953125, 2.278076171875, 2.4134521484375, 2.548828125, 2.6842041015625, 2.819580078125, 2.9549560546875, 3.09033203125, 3.2257080078125, 3.361083984375, 3.4964599609375, 3.6318359375, 3.7672119140625, 3.902587890625, 4.0379638671875, 4.17333984375, 4.3087158203125, 4.444091796875, 4.5794677734375, 4.71484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 15.0, 10.0, 15.0, 23.0, 48.0, 40.0, 57.0, 75.0, 99.0, 120.0, 169.0, 290.0, 421.0, 893.0, 1683.0, 3709.0, 9712.0, 28017.0, 83446.0, 264314.0, 415483.0, 159047.0, 51508.0, 17206.0, 6406.0, 2625.0, 1260.0, 609.0, 389.0, 225.0, 174.0, 103.0, 91.0, 60.0, 52.0, 40.0, 27.0, 29.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.48406982421875, -4.3197021484375, -4.15533447265625, -3.990966796875, -3.82659912109375, -3.6622314453125, -3.49786376953125, -3.33349609375, -3.16912841796875, -3.0047607421875, -2.84039306640625, -2.676025390625, -2.51165771484375, -2.3472900390625, -2.18292236328125, -2.0185546875, -1.85418701171875, -1.6898193359375, -1.52545166015625, -1.361083984375, -1.19671630859375, -1.0323486328125, -0.86798095703125, -0.70361328125, -0.53924560546875, -0.3748779296875, -0.21051025390625, -0.046142578125, 0.11822509765625, 0.2825927734375, 0.44696044921875, 0.611328125, 0.77569580078125, 0.9400634765625, 1.10443115234375, 1.268798828125, 1.43316650390625, 1.5975341796875, 1.76190185546875, 1.92626953125, 2.09063720703125, 2.2550048828125, 2.41937255859375, 2.583740234375, 2.74810791015625, 2.9124755859375, 3.07684326171875, 3.2412109375, 3.40557861328125, 3.5699462890625, 3.73431396484375, 3.898681640625, 4.06304931640625, 4.2274169921875, 4.39178466796875, 4.55615234375, 4.72052001953125, 4.8848876953125, 5.04925537109375, 5.213623046875, 5.37799072265625, 5.5423583984375, 5.70672607421875, 5.87109375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 6.0, 6.0, 16.0, 23.0, 13.0, 20.0, 15.0, 26.0, 30.0, 31.0, 35.0, 30.0, 41.0, 43.0, 71.0, 105.0, 254.0, 1463.0, 230.0, 125.0, 82.0, 55.0, 45.0, 29.0, 32.0, 24.0, 32.0, 28.0, 22.0, 19.0, 19.0, 7.0, 6.0, 9.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-13.9453125, -13.552490234375, -13.15966796875, -12.766845703125, -12.3740234375, -11.981201171875, -11.58837890625, -11.195556640625, -10.802734375, -10.409912109375, -10.01708984375, -9.624267578125, -9.2314453125, -8.838623046875, -8.44580078125, -8.052978515625, -7.66015625, -7.267333984375, -6.87451171875, -6.481689453125, -6.0888671875, -5.696044921875, -5.30322265625, -4.910400390625, -4.517578125, -4.124755859375, -3.73193359375, -3.339111328125, -2.9462890625, -2.553466796875, -2.16064453125, -1.767822265625, -1.375, -0.982177734375, -0.58935546875, -0.196533203125, 0.1962890625, 0.589111328125, 0.98193359375, 1.374755859375, 1.767578125, 2.160400390625, 2.55322265625, 2.946044921875, 3.3388671875, 3.731689453125, 4.12451171875, 4.517333984375, 4.91015625, 5.302978515625, 5.69580078125, 6.088623046875, 6.4814453125, 6.874267578125, 7.26708984375, 7.659912109375, 8.052734375, 8.445556640625, 8.83837890625, 9.231201171875, 9.6240234375, 10.016845703125, 10.40966796875, 10.802490234375, 11.1953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 7.0, 4.0, 12.0, 10.0, 13.0, 21.0, 22.0, 44.0, 56.0, 67.0, 101.0, 145.0, 240.0, 353.0, 608.0, 1188.0, 9514.0, 2306540.0, 818212.0, 5825.0, 1095.0, 563.0, 341.0, 223.0, 134.0, 91.0, 68.0, 60.0, 27.0, 22.0, 13.0, 15.0, 18.0, 6.0, 7.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.765625, -23.989990234375, -23.21435546875, -22.438720703125, -21.6630859375, -20.887451171875, -20.11181640625, -19.336181640625, -18.560546875, -17.784912109375, -17.00927734375, -16.233642578125, -15.4580078125, -14.682373046875, -13.90673828125, -13.131103515625, -12.35546875, -11.579833984375, -10.80419921875, -10.028564453125, -9.2529296875, -8.477294921875, -7.70166015625, -6.926025390625, -6.150390625, -5.374755859375, -4.59912109375, -3.823486328125, -3.0478515625, -2.272216796875, -1.49658203125, -0.720947265625, 0.0546875, 0.830322265625, 1.60595703125, 2.381591796875, 3.1572265625, 3.932861328125, 4.70849609375, 5.484130859375, 6.259765625, 7.035400390625, 7.81103515625, 8.586669921875, 9.3623046875, 10.137939453125, 10.91357421875, 11.689208984375, 12.46484375, 13.240478515625, 14.01611328125, 14.791748046875, 15.5673828125, 16.343017578125, 17.11865234375, 17.894287109375, 18.669921875, 19.445556640625, 20.22119140625, 20.996826171875, 21.7724609375, 22.548095703125, 23.32373046875, 24.099365234375, 24.875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 680.0, 331.0, 0.0, 0.0, 1.0], "bins": [-405.9640197753906, -399.18408203125, -392.4041442871094, -385.62420654296875, -378.84423828125, -372.0643005371094, -365.28436279296875, -358.5044250488281, -351.7244873046875, -344.9445495605469, -338.16461181640625, -331.3846435546875, -324.6047058105469, -317.82476806640625, -311.0448303222656, -304.264892578125, -297.48492431640625, -290.7049865722656, -283.925048828125, -277.14508056640625, -270.3651428222656, -263.585205078125, -256.8052673339844, -250.02532958984375, -243.24539184570312, -236.4654541015625, -229.6855010986328, -222.9055633544922, -216.12562561035156, -209.34567260742188, -202.56573486328125, -195.78579711914062, -189.005859375, -182.22592163085938, -175.4459686279297, -168.66603088378906, -161.88609313964844, -155.10614013671875, -148.32620239257812, -141.5462646484375, -134.7663116455078, -127.98636627197266, -121.20642852783203, -114.42648315429688, -107.64654541015625, -100.8666000366211, -94.08665466308594, -87.30671691894531, -80.52677154541016, -73.746826171875, -66.96688842773438, -60.18694305419922, -53.40700149536133, -46.62705993652344, -39.84711456298828, -33.06717300415039, -26.287233352661133, -19.50728988647461, -12.727348327636719, -5.947404861450195, 0.8325366973876953, 7.612478256225586, 14.392423629760742, 21.172365188598633, 27.952306747436523]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 12.0, 12.0, 12.0, 13.0, 16.0, 29.0, 17.0, 27.0, 26.0, 27.0, 34.0, 43.0, 50.0, 39.0, 37.0, 47.0, 47.0, 47.0, 45.0, 40.0, 37.0, 43.0, 32.0, 40.0, 38.0, 22.0, 27.0, 25.0, 19.0, 16.0, 15.0, 15.0, 9.0, 5.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.35944366455078, -23.451749801635742, -22.544055938720703, -21.63636016845703, -20.728666305541992, -19.820972442626953, -18.913278579711914, -18.005584716796875, -17.097890853881836, -16.190196990966797, -15.282502174377441, -14.374808311462402, -13.467114448547363, -12.559419631958008, -11.651725769042969, -10.74403190612793, -9.836337089538574, -8.928643226623535, -8.02094841003418, -7.113254547119141, -6.205560684204102, -5.297866344451904, -4.390172004699707, -3.482478141784668, -2.5747838020324707, -1.6670897006988525, -0.7593954801559448, 0.1482987403869629, 1.055992841720581, 1.9636869430541992, 2.8713812828063965, 3.7790751457214355, 4.686769485473633, 5.59446382522583, 6.502157688140869, 7.409852027893066, 8.317545890808105, 9.225240707397461, 10.1329345703125, 11.040628433227539, 11.948322296142578, 12.856016159057617, 13.763710975646973, 14.671404838562012, 15.57909870147705, 16.486793518066406, 17.394487380981445, 18.302181243896484, 19.209877014160156, 20.117570877075195, 21.025264739990234, 21.932960510253906, 22.840654373168945, 23.748348236083984, 24.656042098999023, 25.563735961914062, 26.4714298248291, 27.37912368774414, 28.28681755065918, 29.19451141357422, 30.10220718383789, 31.00990104675293, 31.91759490966797, 32.825286865234375, 33.73298263549805]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 9.0, 14.0, 5.0, 7.0, 8.0, 14.0, 18.0, 23.0, 21.0, 24.0, 20.0, 24.0, 33.0, 28.0, 33.0, 29.0, 38.0, 37.0, 37.0, 48.0, 47.0, 40.0, 48.0, 43.0, 35.0, 35.0, 36.0, 26.0, 26.0, 26.0, 23.0, 32.0, 8.0, 24.0, 17.0, 12.0, 6.0, 12.0, 8.0, 3.0, 7.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.748046875, -3.620086669921875, -3.49212646484375, -3.364166259765625, -3.2362060546875, -3.108245849609375, -2.98028564453125, -2.852325439453125, -2.724365234375, -2.596405029296875, -2.46844482421875, -2.340484619140625, -2.2125244140625, -2.084564208984375, -1.95660400390625, -1.828643798828125, -1.70068359375, -1.572723388671875, -1.44476318359375, -1.316802978515625, -1.1888427734375, -1.060882568359375, -0.93292236328125, -0.804962158203125, -0.677001953125, -0.549041748046875, -0.42108154296875, -0.293121337890625, -0.1651611328125, -0.037200927734375, 0.09075927734375, 0.218719482421875, 0.3466796875, 0.474639892578125, 0.60260009765625, 0.730560302734375, 0.8585205078125, 0.986480712890625, 1.11444091796875, 1.242401123046875, 1.370361328125, 1.498321533203125, 1.62628173828125, 1.754241943359375, 1.8822021484375, 2.010162353515625, 2.13812255859375, 2.266082763671875, 2.39404296875, 2.522003173828125, 2.64996337890625, 2.777923583984375, 2.9058837890625, 3.033843994140625, 3.16180419921875, 3.289764404296875, 3.417724609375, 3.545684814453125, 3.67364501953125, 3.801605224609375, 3.9295654296875, 4.057525634765625, 4.18548583984375, 4.313446044921875, 4.44140625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 8.0, 5.0, 6.0, 5.0, 8.0, 8.0, 9.0, 9.0, 19.0, 25.0, 36.0, 23.0, 40.0, 69.0, 80.0, 129.0, 206.0, 360.0, 563.0, 1405.0, 4516.0, 20905.0, 122263.0, 625253.0, 1673659.0, 1301606.0, 363675.0, 63353.0, 10911.0, 2817.0, 1002.0, 481.0, 229.0, 171.0, 89.0, 73.0, 64.0, 49.0, 28.0, 29.0, 24.0, 15.0, 8.0, 17.0, 5.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44140625, -4.28173828125, -4.1220703125, -3.96240234375, -3.802734375, -3.64306640625, -3.4833984375, -3.32373046875, -3.1640625, -3.00439453125, -2.8447265625, -2.68505859375, -2.525390625, -2.36572265625, -2.2060546875, -2.04638671875, -1.88671875, -1.72705078125, -1.5673828125, -1.40771484375, -1.248046875, -1.08837890625, -0.9287109375, -0.76904296875, -0.609375, -0.44970703125, -0.2900390625, -0.13037109375, 0.029296875, 0.18896484375, 0.3486328125, 0.50830078125, 0.66796875, 0.82763671875, 0.9873046875, 1.14697265625, 1.306640625, 1.46630859375, 1.6259765625, 1.78564453125, 1.9453125, 2.10498046875, 2.2646484375, 2.42431640625, 2.583984375, 2.74365234375, 2.9033203125, 3.06298828125, 3.22265625, 3.38232421875, 3.5419921875, 3.70166015625, 3.861328125, 4.02099609375, 4.1806640625, 4.34033203125, 4.5, 4.65966796875, 4.8193359375, 4.97900390625, 5.138671875, 5.29833984375, 5.4580078125, 5.61767578125, 5.77734375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 9.0, 14.0, 10.0, 21.0, 27.0, 30.0, 43.0, 54.0, 77.0, 129.0, 170.0, 241.0, 324.0, 429.0, 461.0, 450.0, 391.0, 311.0, 245.0, 171.0, 116.0, 75.0, 55.0, 47.0, 46.0, 29.0, 19.0, 18.0, 12.0, 8.0, 7.0, 6.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.1953125, -5.0218505859375, -4.848388671875, -4.6749267578125, -4.50146484375, -4.3280029296875, -4.154541015625, -3.9810791015625, -3.8076171875, -3.6341552734375, -3.460693359375, -3.2872314453125, -3.11376953125, -2.9403076171875, -2.766845703125, -2.5933837890625, -2.419921875, -2.2464599609375, -2.072998046875, -1.8995361328125, -1.72607421875, -1.5526123046875, -1.379150390625, -1.2056884765625, -1.0322265625, -0.8587646484375, -0.685302734375, -0.5118408203125, -0.33837890625, -0.1649169921875, 0.008544921875, 0.1820068359375, 0.35546875, 0.5289306640625, 0.702392578125, 0.8758544921875, 1.04931640625, 1.2227783203125, 1.396240234375, 1.5697021484375, 1.7431640625, 1.9166259765625, 2.090087890625, 2.2635498046875, 2.43701171875, 2.6104736328125, 2.783935546875, 2.9573974609375, 3.130859375, 3.3043212890625, 3.477783203125, 3.6512451171875, 3.82470703125, 3.9981689453125, 4.171630859375, 4.3450927734375, 4.5185546875, 4.6920166015625, 4.865478515625, 5.0389404296875, 5.21240234375, 5.3858642578125, 5.559326171875, 5.7327880859375, 5.90625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 10.0, 4.0, 7.0, 15.0, 14.0, 16.0, 27.0, 47.0, 43.0, 61.0, 93.0, 153.0, 229.0, 431.0, 889.0, 2595.0, 11772.0, 82810.0, 1055865.0, 2727464.0, 273268.0, 29895.0, 5487.0, 1616.0, 612.0, 293.0, 190.0, 125.0, 63.0, 47.0, 36.0, 37.0, 16.0, 11.0, 18.0, 5.0, 7.0, 5.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.40625, -7.1129150390625, -6.819580078125, -6.5262451171875, -6.23291015625, -5.9395751953125, -5.646240234375, -5.3529052734375, -5.0595703125, -4.7662353515625, -4.472900390625, -4.1795654296875, -3.88623046875, -3.5928955078125, -3.299560546875, -3.0062255859375, -2.712890625, -2.4195556640625, -2.126220703125, -1.8328857421875, -1.53955078125, -1.2462158203125, -0.952880859375, -0.6595458984375, -0.3662109375, -0.0728759765625, 0.220458984375, 0.5137939453125, 0.80712890625, 1.1004638671875, 1.393798828125, 1.6871337890625, 1.98046875, 2.2738037109375, 2.567138671875, 2.8604736328125, 3.15380859375, 3.4471435546875, 3.740478515625, 4.0338134765625, 4.3271484375, 4.6204833984375, 4.913818359375, 5.2071533203125, 5.50048828125, 5.7938232421875, 6.087158203125, 6.3804931640625, 6.673828125, 6.9671630859375, 7.260498046875, 7.5538330078125, 7.84716796875, 8.1405029296875, 8.433837890625, 8.7271728515625, 9.0205078125, 9.3138427734375, 9.607177734375, 9.9005126953125, 10.19384765625, 10.4871826171875, 10.780517578125, 11.0738525390625, 11.3671875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 89.0, 265.0, 371.0, 221.0, 41.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.562997817993164, -20.562423706054688, -18.56184959411621, -16.561275482177734, -14.560702323913574, -12.560128211975098, -10.559555053710938, -8.558980941772461, -6.558406829833984, -4.557832717895508, -2.5572590827941895, -0.5566854476928711, 1.4438886642456055, 3.444462776184082, 5.445035934448242, 7.445610046386719, 9.446184158325195, 11.446758270263672, 13.447332382202148, 15.447905540466309, 17.44847869873047, 19.449054718017578, 21.449626922607422, 23.4502010345459, 25.450775146484375, 27.45134925842285, 29.451923370361328, 31.452495574951172, 33.45307159423828, 35.453643798828125, 37.45421600341797, 39.45479202270508, 41.45536804199219, 43.45594024658203, 45.45651626586914, 47.457088470458984, 49.457664489746094, 51.45823669433594, 53.45880889892578, 55.45938491821289, 57.4599609375, 59.460533142089844, 61.46110916137695, 63.4616813659668, 65.4622573852539, 67.46282958984375, 69.4634017944336, 71.46397399902344, 73.46455383300781, 75.46512603759766, 77.4656982421875, 79.46627807617188, 81.46685028076172, 83.46742248535156, 85.4679946899414, 87.46856689453125, 89.4691390991211, 91.46971130371094, 93.47028350830078, 95.47086334228516, 97.471435546875, 99.47200775146484, 101.47257995605469, 103.47315979003906, 105.4737319946289]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 6.0, 10.0, 16.0, 9.0, 18.0, 13.0, 24.0, 21.0, 24.0, 34.0, 35.0, 32.0, 29.0, 40.0, 41.0, 41.0, 38.0, 47.0, 33.0, 40.0, 29.0, 42.0, 40.0, 49.0, 32.0, 22.0, 35.0, 29.0, 26.0, 19.0, 20.0, 20.0, 15.0, 8.0, 7.0, 10.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.538654327392578, -19.92561149597168, -19.31256866455078, -18.699525833129883, -18.086483001708984, -17.473440170288086, -16.860397338867188, -16.24735450744629, -15.63431167602539, -15.021268844604492, -14.408226013183594, -13.795183181762695, -13.182140350341797, -12.569097518920898, -11.9560546875, -11.343011856079102, -10.729969024658203, -10.116926193237305, -9.503883361816406, -8.890840530395508, -8.27779769897461, -7.664754867553711, -7.0517120361328125, -6.438669204711914, -5.825626373291016, -5.212583541870117, -4.599540710449219, -3.9864978790283203, -3.373455047607422, -2.7604122161865234, -2.147369384765625, -1.5343265533447266, -0.9212818145751953, -0.3082389831542969, 0.30480384826660156, 0.9178466796875, 1.5308895111083984, 2.143932342529297, 2.7569751739501953, 3.3700180053710938, 3.983060836791992, 4.596103668212891, 5.209146499633789, 5.8221893310546875, 6.435232162475586, 7.048274993896484, 7.661317825317383, 8.274360656738281, 8.88740348815918, 9.500446319580078, 10.113489151000977, 10.726531982421875, 11.339574813842773, 11.952617645263672, 12.56566047668457, 13.178703308105469, 13.791746139526367, 14.404788970947266, 15.017831802368164, 15.630874633789062, 16.24391746520996, 16.85696029663086, 17.470003128051758, 18.083045959472656, 18.696088790893555]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 10.0, 6.0, 12.0, 9.0, 15.0, 16.0, 17.0, 17.0, 33.0, 21.0, 28.0, 27.0, 33.0, 33.0, 30.0, 41.0, 43.0, 32.0, 51.0, 44.0, 36.0, 37.0, 33.0, 42.0, 36.0, 36.0, 31.0, 28.0, 29.0, 27.0, 19.0, 20.0, 19.0, 10.0, 13.0, 8.0, 14.0, 10.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74310302734375, -3.6190185546875, -3.49493408203125, -3.370849609375, -3.24676513671875, -3.1226806640625, -2.99859619140625, -2.87451171875, -2.75042724609375, -2.6263427734375, -2.50225830078125, -2.378173828125, -2.25408935546875, -2.1300048828125, -2.00592041015625, -1.8818359375, -1.75775146484375, -1.6336669921875, -1.50958251953125, -1.385498046875, -1.26141357421875, -1.1373291015625, -1.01324462890625, -0.88916015625, -0.76507568359375, -0.6409912109375, -0.51690673828125, -0.392822265625, -0.26873779296875, -0.1446533203125, -0.02056884765625, 0.103515625, 0.22760009765625, 0.3516845703125, 0.47576904296875, 0.599853515625, 0.72393798828125, 0.8480224609375, 0.97210693359375, 1.09619140625, 1.22027587890625, 1.3443603515625, 1.46844482421875, 1.592529296875, 1.71661376953125, 1.8406982421875, 1.96478271484375, 2.0888671875, 2.21295166015625, 2.3370361328125, 2.46112060546875, 2.585205078125, 2.70928955078125, 2.8333740234375, 2.95745849609375, 3.08154296875, 3.20562744140625, 3.3297119140625, 3.45379638671875, 3.577880859375, 3.70196533203125, 3.8260498046875, 3.95013427734375, 4.07421875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 8.0, 5.0, 16.0, 27.0, 21.0, 41.0, 60.0, 98.0, 134.0, 196.0, 292.0, 438.0, 632.0, 910.0, 1434.0, 2152.0, 3368.0, 4951.0, 7604.0, 11870.0, 18129.0, 29093.0, 46800.0, 79641.0, 145977.0, 277181.0, 177911.0, 93070.0, 54157.0, 33106.0, 20708.0, 13486.0, 8556.0, 5490.0, 3783.0, 2454.0, 1504.0, 1018.0, 710.0, 517.0, 305.0, 223.0, 169.0, 90.0, 69.0, 45.0, 43.0, 21.0, 17.0, 6.0, 11.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.734375, -0.7118759155273438, -0.6893768310546875, -0.6668777465820312, -0.644378662109375, -0.6218795776367188, -0.5993804931640625, -0.5768814086914062, -0.55438232421875, -0.5318832397460938, -0.5093841552734375, -0.48688507080078125, -0.464385986328125, -0.44188690185546875, -0.4193878173828125, -0.39688873291015625, -0.3743896484375, -0.35189056396484375, -0.3293914794921875, -0.30689239501953125, -0.284393310546875, -0.26189422607421875, -0.2393951416015625, -0.21689605712890625, -0.19439697265625, -0.17189788818359375, -0.1493988037109375, -0.12689971923828125, -0.104400634765625, -0.08190155029296875, -0.0594024658203125, -0.03690338134765625, -0.014404296875, 0.00809478759765625, 0.0305938720703125, 0.05309295654296875, 0.075592041015625, 0.09809112548828125, 0.1205902099609375, 0.14308929443359375, 0.16558837890625, 0.18808746337890625, 0.2105865478515625, 0.23308563232421875, 0.255584716796875, 0.27808380126953125, 0.3005828857421875, 0.32308197021484375, 0.3455810546875, 0.36808013916015625, 0.3905792236328125, 0.41307830810546875, 0.435577392578125, 0.45807647705078125, 0.4805755615234375, 0.5030746459960938, 0.52557373046875, 0.5480728149414062, 0.5705718994140625, 0.5930709838867188, 0.615570068359375, 0.6380691528320312, 0.6605682373046875, 0.6830673217773438, 0.70556640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 9.0, 5.0, 12.0, 15.0, 9.0, 15.0, 23.0, 35.0, 23.0, 28.0, 41.0, 41.0, 35.0, 38.0, 35.0, 31.0, 49.0, 36.0, 1071.0, 40.0, 40.0, 36.0, 35.0, 41.0, 28.0, 24.0, 37.0, 26.0, 32.0, 20.0, 14.0, 21.0, 16.0, 8.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.83203125, -2.747344970703125, -2.66265869140625, -2.577972412109375, -2.4932861328125, -2.408599853515625, -2.32391357421875, -2.239227294921875, -2.154541015625, -2.069854736328125, -1.98516845703125, -1.900482177734375, -1.8157958984375, -1.731109619140625, -1.64642333984375, -1.561737060546875, -1.47705078125, -1.392364501953125, -1.30767822265625, -1.222991943359375, -1.1383056640625, -1.053619384765625, -0.96893310546875, -0.884246826171875, -0.799560546875, -0.714874267578125, -0.63018798828125, -0.545501708984375, -0.4608154296875, -0.376129150390625, -0.29144287109375, -0.206756591796875, -0.1220703125, -0.037384033203125, 0.04730224609375, 0.131988525390625, 0.2166748046875, 0.301361083984375, 0.38604736328125, 0.470733642578125, 0.555419921875, 0.640106201171875, 0.72479248046875, 0.809478759765625, 0.8941650390625, 0.978851318359375, 1.06353759765625, 1.148223876953125, 1.23291015625, 1.317596435546875, 1.40228271484375, 1.486968994140625, 1.5716552734375, 1.656341552734375, 1.74102783203125, 1.825714111328125, 1.910400390625, 1.995086669921875, 2.07977294921875, 2.164459228515625, 2.2491455078125, 2.333831787109375, 2.41851806640625, 2.503204345703125, 2.587890625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 13.0, 19.0, 28.0, 39.0, 61.0, 93.0, 155.0, 211.0, 334.0, 491.0, 703.0, 1066.0, 1593.0, 2403.0, 3568.0, 5539.0, 8612.0, 13501.0, 21433.0, 34299.0, 58389.0, 104573.0, 218118.0, 1319128.0, 124744.0, 68872.0, 40489.0, 24676.0, 15432.0, 9776.0, 6370.0, 4159.0, 2762.0, 1890.0, 1277.0, 814.0, 529.0, 345.0, 218.0, 149.0, 99.0, 56.0, 28.0, 33.0, 18.0, 5.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7358932495117188, -0.7129974365234375, -0.6901016235351562, -0.667205810546875, -0.6443099975585938, -0.6214141845703125, -0.5985183715820312, -0.57562255859375, -0.5527267456054688, -0.5298309326171875, -0.5069351196289062, -0.484039306640625, -0.46114349365234375, -0.4382476806640625, -0.41535186767578125, -0.3924560546875, -0.36956024169921875, -0.3466644287109375, -0.32376861572265625, -0.300872802734375, -0.27797698974609375, -0.2550811767578125, -0.23218536376953125, -0.20928955078125, -0.18639373779296875, -0.1634979248046875, -0.14060211181640625, -0.117706298828125, -0.09481048583984375, -0.0719146728515625, -0.04901885986328125, -0.026123046875, -0.00322723388671875, 0.0196685791015625, 0.04256439208984375, 0.065460205078125, 0.08835601806640625, 0.1112518310546875, 0.13414764404296875, 0.15704345703125, 0.17993927001953125, 0.2028350830078125, 0.22573089599609375, 0.248626708984375, 0.27152252197265625, 0.2944183349609375, 0.31731414794921875, 0.3402099609375, 0.36310577392578125, 0.3860015869140625, 0.40889739990234375, 0.431793212890625, 0.45468902587890625, 0.4775848388671875, 0.5004806518554688, 0.52337646484375, 0.5462722778320312, 0.5691680908203125, 0.5920639038085938, 0.614959716796875, 0.6378555297851562, 0.6607513427734375, 0.6836471557617188, 0.70654296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 5.0, 10.0, 14.0, 11.0, 13.0, 17.0, 19.0, 32.0, 32.0, 41.0, 56.0, 57.0, 63.0, 65.0, 78.0, 84.0, 71.0, 53.0, 33.0, 46.0, 41.0, 36.0, 22.0, 18.0, 15.0, 12.0, 8.0, 3.0, 15.0, 4.0, 5.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004181861877441406, -0.000403478741645813, -0.00038877129554748535, -0.0003740638494491577, -0.0003593564033508301, -0.00034464895725250244, -0.0003299415111541748, -0.00031523406505584717, -0.00030052661895751953, -0.0002858191728591919, -0.00027111172676086426, -0.0002564042806625366, -0.00024169683456420898, -0.00022698938846588135, -0.0002122819423675537, -0.00019757449626922607, -0.00018286705017089844, -0.0001681596040725708, -0.00015345215797424316, -0.00013874471187591553, -0.0001240372657775879, -0.00010932981967926025, -9.462237358093262e-05, -7.991492748260498e-05, -6.520748138427734e-05, -5.050003528594971e-05, -3.579258918762207e-05, -2.1085143089294434e-05, -6.377696990966797e-06, 8.32974910736084e-06, 2.3037195205688477e-05, 3.774464130401611e-05, 5.245208740234375e-05, 6.715953350067139e-05, 8.186697959899902e-05, 9.657442569732666e-05, 0.0001112818717956543, 0.00012598931789398193, 0.00014069676399230957, 0.0001554042100906372, 0.00017011165618896484, 0.00018481910228729248, 0.00019952654838562012, 0.00021423399448394775, 0.0002289414405822754, 0.00024364888668060303, 0.00025835633277893066, 0.0002730637788772583, 0.00028777122497558594, 0.0003024786710739136, 0.0003171861171722412, 0.00033189356327056885, 0.0003466010093688965, 0.0003613084554672241, 0.00037601590156555176, 0.0003907233476638794, 0.00040543079376220703, 0.00042013823986053467, 0.0004348456859588623, 0.00044955313205718994, 0.0004642605781555176, 0.0004789680242538452, 0.0004936754703521729, 0.0005083829164505005, 0.0005230903625488281]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 3.0, 4.0, 5.0, 6.0, 13.0, 17.0, 20.0, 21.0, 21.0, 38.0, 41.0, 66.0, 94.0, 135.0, 198.0, 283.0, 555.0, 1271.0, 362612.0, 680038.0, 1544.0, 603.0, 303.0, 187.0, 130.0, 80.0, 67.0, 31.0, 35.0, 28.0, 26.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.01032257080078125, -0.010043919086456299, -0.009765267372131348, -0.009486615657806396, -0.009207963943481445, -0.008929312229156494, -0.008650660514831543, -0.008372008800506592, -0.00809335708618164, -0.00781470537185669, -0.007536053657531738, -0.007257401943206787, -0.006978750228881836, -0.006700098514556885, -0.006421446800231934, -0.006142795085906982, -0.005864143371582031, -0.00558549165725708, -0.005306839942932129, -0.005028188228607178, -0.0047495365142822266, -0.004470884799957275, -0.004192233085632324, -0.003913581371307373, -0.003634929656982422, -0.0033562779426574707, -0.0030776262283325195, -0.0027989745140075684, -0.002520322799682617, -0.002241671085357666, -0.001963019371032715, -0.0016843676567077637, -0.0014057159423828125, -0.0011270642280578613, -0.0008484125137329102, -0.000569760799407959, -0.0002911090850830078, -1.245737075805664e-05, 0.00026619434356689453, 0.0005448460578918457, 0.0008234977722167969, 0.001102149486541748, 0.0013808012008666992, 0.0016594529151916504, 0.0019381046295166016, 0.0022167563438415527, 0.002495408058166504, 0.002774059772491455, 0.0030527114868164062, 0.0033313632011413574, 0.0036100149154663086, 0.0038886666297912598, 0.004167318344116211, 0.004445970058441162, 0.004724621772766113, 0.0050032734870910645, 0.005281925201416016, 0.005560576915740967, 0.005839228630065918, 0.006117880344390869, 0.00639653205871582, 0.0066751837730407715, 0.006953835487365723, 0.007232487201690674, 0.007511138916015625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 14.0, 49.0, 103.0, 199.0, 230.0, 177.0, 139.0, 57.0, 20.0, 15.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006207413389347494, -0.0006061834865249693, -0.0005916256923228502, -0.0005770678399130702, -0.0005625099875032902, -0.0005479521350935102, -0.0005333942826837301, -0.000518836488481611, -0.000504278636071831, -0.000489720783662051, -0.0004751629603561014, -0.0004606051370501518, -0.0004460472846403718, -0.0004314894322305918, -0.0004169316089246422, -0.00040237378561869264, -0.0003878159332089126, -0.0003732580807991326, -0.000358700257493183, -0.00034414243418723345, -0.0003295845817774534, -0.0003150267293676734, -0.00030046890606172383, -0.00028591108275577426, -0.00027135323034599423, -0.0002567953779362142, -0.00024223755463026464, -0.00022767971677239984, -0.00021312187891453505, -0.00019856404105667025, -0.00018400620319880545, -0.00016944836534094065, -0.00015489052748307586, -0.00014033268962521106, -0.00012577485176734626, -0.00011121701390948147, -9.665917605161667e-05, -8.210133819375187e-05, -6.754350033588707e-05, -5.298566247802228e-05, -3.842782462015748e-05, -2.3869986762292683e-05, -9.312148904427886e-06, 5.245688953436911e-06, 1.9803526811301708e-05, 3.4361364669166505e-05, 4.89192025270313e-05, 6.34770403848961e-05, 7.80348782427609e-05, 9.25927161006257e-05, 0.00010715055395849049, 0.00012170839181635529, 0.00013626622967422009, 0.00015082406753208488, 0.00016538190538994968, 0.00017993974324781448, 0.00019449758110567927, 0.00020905541896354407, 0.00022361325682140887, 0.00023817109467927366, 0.00025272893253713846, 0.0002672867849469185, 0.00028184460825286806, 0.0002964024315588176, 0.00031096028396859765]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 6.0, 7.0, 9.0, 3.0, 6.0, 11.0, 10.0, 13.0, 10.0, 17.0, 15.0, 17.0, 30.0, 32.0, 35.0, 35.0, 32.0, 24.0, 38.0, 49.0, 45.0, 29.0, 35.0, 36.0, 32.0, 35.0, 34.0, 41.0, 35.0, 30.0, 33.0, 29.0, 34.0, 21.0, 20.0, 29.0, 18.0, 13.0, 19.0, 6.0, 8.0, 3.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019699335098266602, -0.0001905057579278946, -0.00018401816487312317, -0.00017753057181835175, -0.00017104297876358032, -0.0001645553857088089, -0.00015806779265403748, -0.00015158019959926605, -0.00014509260654449463, -0.0001386050134897232, -0.00013211742043495178, -0.00012562982738018036, -0.00011914223432540894, -0.00011265464127063751, -0.00010616704821586609, -9.967945516109467e-05, -9.319186210632324e-05, -8.670426905155182e-05, -8.02166759967804e-05, -7.372908294200897e-05, -6.724148988723755e-05, -6.0753896832466125e-05, -5.42663037776947e-05, -4.777871072292328e-05, -4.1291117668151855e-05, -3.480352461338043e-05, -2.831593155860901e-05, -2.1828338503837585e-05, -1.5340745449066162e-05, -8.853152394294739e-06, -2.3655593395233154e-06, 4.122033715248108e-06, 1.0609626770019531e-05, 1.7097219824790955e-05, 2.3584812879562378e-05, 3.00724059343338e-05, 3.6559998989105225e-05, 4.304759204387665e-05, 4.953518509864807e-05, 5.6022778153419495e-05, 6.251037120819092e-05, 6.899796426296234e-05, 7.548555731773376e-05, 8.197315037250519e-05, 8.846074342727661e-05, 9.494833648204803e-05, 0.00010143592953681946, 0.00010792352259159088, 0.0001144111156463623, 0.00012089870870113373, 0.00012738630175590515, 0.00013387389481067657, 0.000140361487865448, 0.00014684908092021942, 0.00015333667397499084, 0.00015982426702976227, 0.0001663118600845337, 0.00017279945313930511, 0.00017928704619407654, 0.00018577463924884796, 0.00019226223230361938, 0.0001987498253583908, 0.00020523741841316223, 0.00021172501146793365, 0.00021821260452270508]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 10.0, 6.0, 12.0, 9.0, 15.0, 16.0, 17.0, 17.0, 33.0, 21.0, 28.0, 27.0, 33.0, 33.0, 30.0, 41.0, 43.0, 32.0, 51.0, 44.0, 36.0, 37.0, 33.0, 42.0, 36.0, 36.0, 31.0, 28.0, 29.0, 27.0, 19.0, 20.0, 19.0, 10.0, 13.0, 8.0, 14.0, 10.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74310302734375, -3.6190185546875, -3.49493408203125, -3.370849609375, -3.24676513671875, -3.1226806640625, -2.99859619140625, -2.87451171875, -2.75042724609375, -2.6263427734375, -2.50225830078125, -2.378173828125, -2.25408935546875, -2.1300048828125, -2.00592041015625, -1.8818359375, -1.75775146484375, -1.6336669921875, -1.50958251953125, -1.385498046875, -1.26141357421875, -1.1373291015625, -1.01324462890625, -0.88916015625, -0.76507568359375, -0.6409912109375, -0.51690673828125, -0.392822265625, -0.26873779296875, -0.1446533203125, -0.02056884765625, 0.103515625, 0.22760009765625, 0.3516845703125, 0.47576904296875, 0.599853515625, 0.72393798828125, 0.8480224609375, 0.97210693359375, 1.09619140625, 1.22027587890625, 1.3443603515625, 1.46844482421875, 1.592529296875, 1.71661376953125, 1.8406982421875, 1.96478271484375, 2.0888671875, 2.21295166015625, 2.3370361328125, 2.46112060546875, 2.585205078125, 2.70928955078125, 2.8333740234375, 2.95745849609375, 3.08154296875, 3.20562744140625, 3.3297119140625, 3.45379638671875, 3.577880859375, 3.70196533203125, 3.8260498046875, 3.95013427734375, 4.07421875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 6.0, 9.0, 15.0, 22.0, 30.0, 39.0, 57.0, 61.0, 64.0, 97.0, 124.0, 192.0, 253.0, 346.0, 500.0, 767.0, 1344.0, 2880.0, 6768.0, 20609.0, 68648.0, 207210.0, 379909.0, 237712.0, 81141.0, 24673.0, 7712.0, 3034.0, 1558.0, 868.0, 510.0, 351.0, 267.0, 177.0, 140.0, 102.0, 107.0, 65.0, 39.0, 41.0, 23.0, 18.0, 19.0, 18.0, 6.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.0390625, -4.87945556640625, -4.7198486328125, -4.56024169921875, -4.400634765625, -4.24102783203125, -4.0814208984375, -3.92181396484375, -3.76220703125, -3.60260009765625, -3.4429931640625, -3.28338623046875, -3.123779296875, -2.96417236328125, -2.8045654296875, -2.64495849609375, -2.4853515625, -2.32574462890625, -2.1661376953125, -2.00653076171875, -1.846923828125, -1.68731689453125, -1.5277099609375, -1.36810302734375, -1.20849609375, -1.04888916015625, -0.8892822265625, -0.72967529296875, -0.570068359375, -0.41046142578125, -0.2508544921875, -0.09124755859375, 0.068359375, 0.22796630859375, 0.3875732421875, 0.54718017578125, 0.706787109375, 0.86639404296875, 1.0260009765625, 1.18560791015625, 1.34521484375, 1.50482177734375, 1.6644287109375, 1.82403564453125, 1.983642578125, 2.14324951171875, 2.3028564453125, 2.46246337890625, 2.6220703125, 2.78167724609375, 2.9412841796875, 3.10089111328125, 3.260498046875, 3.42010498046875, 3.5797119140625, 3.73931884765625, 3.89892578125, 4.05853271484375, 4.2181396484375, 4.37774658203125, 4.537353515625, 4.69696044921875, 4.8565673828125, 5.01617431640625, 5.17578125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 7.0, 16.0, 14.0, 16.0, 23.0, 27.0, 27.0, 30.0, 33.0, 41.0, 52.0, 54.0, 77.0, 162.0, 323.0, 1413.0, 185.0, 87.0, 73.0, 57.0, 48.0, 39.0, 44.0, 38.0, 22.0, 27.0, 22.0, 14.0, 13.0, 5.0, 8.0, 4.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.8125, -11.4320068359375, -11.051513671875, -10.6710205078125, -10.29052734375, -9.9100341796875, -9.529541015625, -9.1490478515625, -8.7685546875, -8.3880615234375, -8.007568359375, -7.6270751953125, -7.24658203125, -6.8660888671875, -6.485595703125, -6.1051025390625, -5.724609375, -5.3441162109375, -4.963623046875, -4.5831298828125, -4.20263671875, -3.8221435546875, -3.441650390625, -3.0611572265625, -2.6806640625, -2.3001708984375, -1.919677734375, -1.5391845703125, -1.15869140625, -0.7781982421875, -0.397705078125, -0.0172119140625, 0.36328125, 0.7437744140625, 1.124267578125, 1.5047607421875, 1.88525390625, 2.2657470703125, 2.646240234375, 3.0267333984375, 3.4072265625, 3.7877197265625, 4.168212890625, 4.5487060546875, 4.92919921875, 5.3096923828125, 5.690185546875, 6.0706787109375, 6.451171875, 6.8316650390625, 7.212158203125, 7.5926513671875, 7.97314453125, 8.3536376953125, 8.734130859375, 9.1146240234375, 9.4951171875, 9.8756103515625, 10.256103515625, 10.6365966796875, 11.01708984375, 11.3975830078125, 11.778076171875, 12.1585693359375, 12.5390625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 3.0, 15.0, 12.0, 17.0, 30.0, 40.0, 49.0, 71.0, 86.0, 132.0, 249.0, 356.0, 612.0, 1252.0, 6442.0, 2666720.0, 463996.0, 3304.0, 896.0, 480.0, 305.0, 208.0, 135.0, 85.0, 55.0, 42.0, 33.0, 15.0, 25.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.953125, -30.09033203125, -29.2275390625, -28.36474609375, -27.501953125, -26.63916015625, -25.7763671875, -24.91357421875, -24.05078125, -23.18798828125, -22.3251953125, -21.46240234375, -20.599609375, -19.73681640625, -18.8740234375, -18.01123046875, -17.1484375, -16.28564453125, -15.4228515625, -14.56005859375, -13.697265625, -12.83447265625, -11.9716796875, -11.10888671875, -10.24609375, -9.38330078125, -8.5205078125, -7.65771484375, -6.794921875, -5.93212890625, -5.0693359375, -4.20654296875, -3.34375, -2.48095703125, -1.6181640625, -0.75537109375, 0.107421875, 0.97021484375, 1.8330078125, 2.69580078125, 3.55859375, 4.42138671875, 5.2841796875, 6.14697265625, 7.009765625, 7.87255859375, 8.7353515625, 9.59814453125, 10.4609375, 11.32373046875, 12.1865234375, 13.04931640625, 13.912109375, 14.77490234375, 15.6376953125, 16.50048828125, 17.36328125, 18.22607421875, 19.0888671875, 19.95166015625, 20.814453125, 21.67724609375, 22.5400390625, 23.40283203125, 24.265625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 91.0, 584.0, 316.0, 17.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.23248291015625, -66.64657592773438, -64.0606689453125, -61.474761962890625, -58.888858795166016, -56.30295181274414, -53.717044830322266, -51.131141662597656, -48.54523468017578, -45.959327697753906, -43.37342071533203, -40.787513732910156, -38.20161056518555, -35.61570358276367, -33.0297966003418, -30.443891525268555, -27.857982635498047, -25.272075653076172, -22.68617057800293, -20.100263595581055, -17.514358520507812, -14.928451538085938, -12.342544555664062, -9.75663948059082, -7.170732498168945, -4.584826469421387, -1.99891996383667, 0.5869865417480469, 3.1728925704956055, 5.758798599243164, 8.344705581665039, 10.930610656738281, 13.516517639160156, 16.10242462158203, 18.688329696655273, 21.27423667907715, 23.86014175415039, 26.446048736572266, 29.03195571899414, 31.617860794067383, 34.203765869140625, 36.7896728515625, 39.375579833984375, 41.96148681640625, 44.54738998413086, 47.133296966552734, 49.71920394897461, 52.30510711669922, 54.89101791381836, 57.476924896240234, 60.06283187866211, 62.64873504638672, 65.2346420288086, 67.82054901123047, 70.40645599365234, 72.99236297607422, 75.5782699584961, 78.16417694091797, 80.75008392333984, 83.33599090576172, 85.9218978881836, 88.50779724121094, 91.09370422363281, 93.67961120605469, 96.26551818847656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 9.0, 7.0, 11.0, 16.0, 25.0, 24.0, 25.0, 22.0, 30.0, 31.0, 36.0, 43.0, 41.0, 43.0, 45.0, 49.0, 59.0, 38.0, 54.0, 54.0, 42.0, 35.0, 35.0, 25.0, 23.0, 38.0, 27.0, 21.0, 14.0, 18.0, 12.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.111183166503906, -21.219919204711914, -20.328655242919922, -19.437393188476562, -18.54612922668457, -17.654865264892578, -16.76360321044922, -15.872339248657227, -14.981075286865234, -14.089811325073242, -13.198548316955566, -12.30728530883789, -11.416021347045898, -10.524757385253906, -9.63349437713623, -8.742231369018555, -7.8509674072265625, -6.9597039222717285, -6.0684404373168945, -5.1771769523620605, -4.285913467407227, -3.3946499824523926, -2.5033864974975586, -1.6121230125427246, -0.7208595275878906, 0.17040395736694336, 1.0616674423217773, 1.9529309272766113, 2.8441944122314453, 3.7354578971862793, 4.626721382141113, 5.517984867095947, 6.409248352050781, 7.300511837005615, 8.19177532196045, 9.083038330078125, 9.974302291870117, 10.86556625366211, 11.756829261779785, 12.648092269897461, 13.539356231689453, 14.430620193481445, 15.321883201599121, 16.213146209716797, 17.10441017150879, 17.99567413330078, 18.88693618774414, 19.778200149536133, 20.669464111328125, 21.560728073120117, 22.45199203491211, 23.34325408935547, 24.23451805114746, 25.125782012939453, 26.017044067382812, 26.908308029174805, 27.799571990966797, 28.69083595275879, 29.58209991455078, 30.47336196899414, 31.364625930786133, 32.255889892578125, 33.147151947021484, 34.03841781616211, 34.92967987060547]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 11.0, 15.0, 16.0, 17.0, 21.0, 22.0, 29.0, 27.0, 30.0, 29.0, 39.0, 32.0, 36.0, 36.0, 45.0, 52.0, 41.0, 52.0, 31.0, 35.0, 47.0, 39.0, 25.0, 26.0, 26.0, 35.0, 22.0, 23.0, 25.0, 18.0, 13.0, 5.0, 14.0, 6.0, 13.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.935546875, -3.810150146484375, -3.68475341796875, -3.559356689453125, -3.4339599609375, -3.308563232421875, -3.18316650390625, -3.057769775390625, -2.932373046875, -2.806976318359375, -2.68157958984375, -2.556182861328125, -2.4307861328125, -2.305389404296875, -2.17999267578125, -2.054595947265625, -1.92919921875, -1.803802490234375, -1.67840576171875, -1.553009033203125, -1.4276123046875, -1.302215576171875, -1.17681884765625, -1.051422119140625, -0.926025390625, -0.800628662109375, -0.67523193359375, -0.549835205078125, -0.4244384765625, -0.299041748046875, -0.17364501953125, -0.048248291015625, 0.0771484375, 0.202545166015625, 0.32794189453125, 0.453338623046875, 0.5787353515625, 0.704132080078125, 0.82952880859375, 0.954925537109375, 1.080322265625, 1.205718994140625, 1.33111572265625, 1.456512451171875, 1.5819091796875, 1.707305908203125, 1.83270263671875, 1.958099365234375, 2.08349609375, 2.208892822265625, 2.33428955078125, 2.459686279296875, 2.5850830078125, 2.710479736328125, 2.83587646484375, 2.961273193359375, 3.086669921875, 3.212066650390625, 3.33746337890625, 3.462860107421875, 3.5882568359375, 3.713653564453125, 3.83905029296875, 3.964447021484375, 4.08984375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 7.0, 7.0, 9.0, 14.0, 10.0, 19.0, 24.0, 28.0, 25.0, 34.0, 36.0, 61.0, 75.0, 100.0, 129.0, 179.0, 236.0, 258.0, 340.0, 599.0, 25928.0, 4161698.0, 2541.0, 438.0, 319.0, 251.0, 214.0, 152.0, 101.0, 92.0, 58.0, 52.0, 51.0, 30.0, 31.0, 25.0, 21.0, 13.0, 13.0, 8.0, 10.0, 11.0, 6.0, 6.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-40.53125, -39.150390625, -37.76953125, -36.388671875, -35.0078125, -33.626953125, -32.24609375, -30.865234375, -29.484375, -28.103515625, -26.72265625, -25.341796875, -23.9609375, -22.580078125, -21.19921875, -19.818359375, -18.4375, -17.056640625, -15.67578125, -14.294921875, -12.9140625, -11.533203125, -10.15234375, -8.771484375, -7.390625, -6.009765625, -4.62890625, -3.248046875, -1.8671875, -0.486328125, 0.89453125, 2.275390625, 3.65625, 5.037109375, 6.41796875, 7.798828125, 9.1796875, 10.560546875, 11.94140625, 13.322265625, 14.703125, 16.083984375, 17.46484375, 18.845703125, 20.2265625, 21.607421875, 22.98828125, 24.369140625, 25.75, 27.130859375, 28.51171875, 29.892578125, 31.2734375, 32.654296875, 34.03515625, 35.416015625, 36.796875, 38.177734375, 39.55859375, 40.939453125, 42.3203125, 43.701171875, 45.08203125, 46.462890625, 47.84375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 3.0, 10.0, 12.0, 9.0, 22.0, 28.0, 40.0, 62.0, 85.0, 134.0, 164.0, 241.0, 374.0, 496.0, 593.0, 565.0, 371.0, 242.0, 162.0, 122.0, 100.0, 48.0, 47.0, 39.0, 18.0, 26.0, 9.0, 13.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.61328125, -5.4095458984375, -5.205810546875, -5.0020751953125, -4.79833984375, -4.5946044921875, -4.390869140625, -4.1871337890625, -3.9833984375, -3.7796630859375, -3.575927734375, -3.3721923828125, -3.16845703125, -2.9647216796875, -2.760986328125, -2.5572509765625, -2.353515625, -2.1497802734375, -1.946044921875, -1.7423095703125, -1.53857421875, -1.3348388671875, -1.131103515625, -0.9273681640625, -0.7236328125, -0.5198974609375, -0.316162109375, -0.1124267578125, 0.09130859375, 0.2950439453125, 0.498779296875, 0.7025146484375, 0.90625, 1.1099853515625, 1.313720703125, 1.5174560546875, 1.72119140625, 1.9249267578125, 2.128662109375, 2.3323974609375, 2.5361328125, 2.7398681640625, 2.943603515625, 3.1473388671875, 3.35107421875, 3.5548095703125, 3.758544921875, 3.9622802734375, 4.166015625, 4.3697509765625, 4.573486328125, 4.7772216796875, 4.98095703125, 5.1846923828125, 5.388427734375, 5.5921630859375, 5.7958984375, 5.9996337890625, 6.203369140625, 6.4071044921875, 6.61083984375, 6.8145751953125, 7.018310546875, 7.2220458984375, 7.42578125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 3.0, 15.0, 17.0, 10.0, 17.0, 35.0, 46.0, 53.0, 77.0, 104.0, 224.0, 789.0, 27606.0, 4117399.0, 46294.0, 955.0, 222.0, 95.0, 63.0, 69.0, 43.0, 29.0, 22.0, 18.0, 15.0, 9.0, 11.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.5, -38.44775390625, -37.3955078125, -36.34326171875, -35.291015625, -34.23876953125, -33.1865234375, -32.13427734375, -31.08203125, -30.02978515625, -28.9775390625, -27.92529296875, -26.873046875, -25.82080078125, -24.7685546875, -23.71630859375, -22.6640625, -21.61181640625, -20.5595703125, -19.50732421875, -18.455078125, -17.40283203125, -16.3505859375, -15.29833984375, -14.24609375, -13.19384765625, -12.1416015625, -11.08935546875, -10.037109375, -8.98486328125, -7.9326171875, -6.88037109375, -5.828125, -4.77587890625, -3.7236328125, -2.67138671875, -1.619140625, -0.56689453125, 0.4853515625, 1.53759765625, 2.58984375, 3.64208984375, 4.6943359375, 5.74658203125, 6.798828125, 7.85107421875, 8.9033203125, 9.95556640625, 11.0078125, 12.06005859375, 13.1123046875, 14.16455078125, 15.216796875, 16.26904296875, 17.3212890625, 18.37353515625, 19.42578125, 20.47802734375, 21.5302734375, 22.58251953125, 23.634765625, 24.68701171875, 25.7392578125, 26.79150390625, 27.84375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 142.0, 685.0, 175.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-213.35162353515625, -209.44268798828125, -205.53375244140625, -201.6248016357422, -197.7158660888672, -193.8069305419922, -189.89797973632812, -185.98904418945312, -182.08010864257812, -178.17117309570312, -174.26223754882812, -170.35328674316406, -166.44435119628906, -162.53541564941406, -158.62646484375, -154.717529296875, -150.80859375, -146.899658203125, -142.99072265625, -139.08177185058594, -135.17283630371094, -131.26390075683594, -127.3549575805664, -123.44601440429688, -119.53707885742188, -115.62814331054688, -111.71920013427734, -107.81025695800781, -103.90132141113281, -99.99238586425781, -96.08344268798828, -92.17449951171875, -88.26556396484375, -84.35662841796875, -80.44768524169922, -76.53874206542969, -72.62980651855469, -68.72087097167969, -64.81192779541016, -60.90298843383789, -56.994049072265625, -53.08510971069336, -49.176170349121094, -45.26723098754883, -41.35829162597656, -37.4493522644043, -33.54041290283203, -29.631473541259766, -25.7225341796875, -21.813594818115234, -17.90465545654297, -13.995716094970703, -10.086776733398438, -6.177837371826172, -2.2688980102539062, 1.6400413513183594, 5.548980712890625, 9.45792007446289, 13.366859436035156, 17.275798797607422, 21.184738159179688, 25.093677520751953, 29.00261688232422, 32.911556243896484, 36.82049560546875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 7.0, 3.0, 11.0, 11.0, 14.0, 12.0, 11.0, 16.0, 22.0, 27.0, 26.0, 32.0, 38.0, 45.0, 32.0, 36.0, 52.0, 56.0, 42.0, 41.0, 44.0, 47.0, 44.0, 40.0, 45.0, 21.0, 27.0, 29.0, 27.0, 24.0, 23.0, 15.0, 18.0, 10.0, 10.0, 8.0, 10.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.761035919189453, -19.073503494262695, -18.385971069335938, -17.69843864440918, -17.010906219482422, -16.323373794555664, -15.635842323303223, -14.948309898376465, -14.260777473449707, -13.57324504852295, -12.885712623596191, -12.19818115234375, -11.510648727416992, -10.823116302490234, -10.135583877563477, -9.448051452636719, -8.760519027709961, -8.072986602783203, -7.385454177856445, -6.697922229766846, -6.010389804840088, -5.32285737991333, -4.6353254318237305, -3.9477930068969727, -3.260260581970215, -2.572728157043457, -1.8851959705352783, -1.1976637840270996, -0.5101313591003418, 0.17740106582641602, 0.8649330139160156, 1.5524654388427734, 2.2399978637695312, 2.927530288696289, 3.6150624752044678, 4.3025946617126465, 4.990127086639404, 5.677659511566162, 6.365191459655762, 7.0527238845825195, 7.740256309509277, 8.427788734436035, 9.115321159362793, 9.802852630615234, 10.490385055541992, 11.17791748046875, 11.865449905395508, 12.552982330322266, 13.240514755249023, 13.928047180175781, 14.615579605102539, 15.303112030029297, 15.990644454956055, 16.678176879882812, 17.365707397460938, 18.053241729736328, 18.740772247314453, 19.42830467224121, 20.11583709716797, 20.803369522094727, 21.490901947021484, 22.178434371948242, 22.865966796875, 23.553497314453125, 24.241031646728516]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 8.0, 19.0, 11.0, 14.0, 15.0, 25.0, 26.0, 22.0, 26.0, 30.0, 29.0, 33.0, 47.0, 41.0, 39.0, 60.0, 47.0, 40.0, 48.0, 39.0, 52.0, 31.0, 40.0, 35.0, 33.0, 33.0, 24.0, 23.0, 21.0, 14.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.0982666015625, -2.973876953125, -2.8494873046875, -2.72509765625, -2.6007080078125, -2.476318359375, -2.3519287109375, -2.2275390625, -2.1031494140625, -1.978759765625, -1.8543701171875, -1.72998046875, -1.6055908203125, -1.481201171875, -1.3568115234375, -1.232421875, -1.1080322265625, -0.983642578125, -0.8592529296875, -0.73486328125, -0.6104736328125, -0.486083984375, -0.3616943359375, -0.2373046875, -0.1129150390625, 0.011474609375, 0.1358642578125, 0.26025390625, 0.3846435546875, 0.509033203125, 0.6334228515625, 0.7578125, 0.8822021484375, 1.006591796875, 1.1309814453125, 1.25537109375, 1.3797607421875, 1.504150390625, 1.6285400390625, 1.7529296875, 1.8773193359375, 2.001708984375, 2.1260986328125, 2.25048828125, 2.3748779296875, 2.499267578125, 2.6236572265625, 2.748046875, 2.8724365234375, 2.996826171875, 3.1212158203125, 3.24560546875, 3.3699951171875, 3.494384765625, 3.6187744140625, 3.7431640625, 3.8675537109375, 3.991943359375, 4.1163330078125, 4.24072265625, 4.3651123046875, 4.489501953125, 4.6138916015625, 4.73828125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 11.0, 15.0, 22.0, 22.0, 45.0, 55.0, 101.0, 138.0, 199.0, 344.0, 491.0, 831.0, 1196.0, 1979.0, 3070.0, 5110.0, 8209.0, 13514.0, 22336.0, 39223.0, 73963.0, 152494.0, 319746.0, 197485.0, 92267.0, 47844.0, 26828.0, 15707.0, 9450.0, 5811.0, 3616.0, 2281.0, 1464.0, 959.0, 646.0, 402.0, 245.0, 127.0, 112.0, 69.0, 54.0, 16.0, 20.0, 14.0, 13.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.796875, -0.7724761962890625, -0.748077392578125, -0.7236785888671875, -0.69927978515625, -0.6748809814453125, -0.650482177734375, -0.6260833740234375, -0.6016845703125, -0.5772857666015625, -0.552886962890625, -0.5284881591796875, -0.50408935546875, -0.4796905517578125, -0.455291748046875, -0.4308929443359375, -0.406494140625, -0.3820953369140625, -0.357696533203125, -0.3332977294921875, -0.30889892578125, -0.2845001220703125, -0.260101318359375, -0.2357025146484375, -0.2113037109375, -0.1869049072265625, -0.162506103515625, -0.1381072998046875, -0.11370849609375, -0.0893096923828125, -0.064910888671875, -0.0405120849609375, -0.01611328125, 0.0082855224609375, 0.032684326171875, 0.0570831298828125, 0.08148193359375, 0.1058807373046875, 0.130279541015625, 0.1546783447265625, 0.1790771484375, 0.2034759521484375, 0.227874755859375, 0.2522735595703125, 0.27667236328125, 0.3010711669921875, 0.325469970703125, 0.3498687744140625, 0.374267578125, 0.3986663818359375, 0.423065185546875, 0.4474639892578125, 0.47186279296875, 0.4962615966796875, 0.520660400390625, 0.5450592041015625, 0.5694580078125, 0.5938568115234375, 0.618255615234375, 0.6426544189453125, 0.66705322265625, 0.6914520263671875, 0.715850830078125, 0.7402496337890625, 0.7646484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 7.0, 8.0, 9.0, 11.0, 11.0, 13.0, 14.0, 23.0, 16.0, 18.0, 24.0, 21.0, 32.0, 25.0, 27.0, 44.0, 35.0, 38.0, 40.0, 50.0, 1067.0, 61.0, 38.0, 39.0, 41.0, 35.0, 36.0, 37.0, 23.0, 18.0, 21.0, 23.0, 23.0, 20.0, 12.0, 14.0, 6.0, 10.0, 7.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.2471923828125, -2.174072265625, -2.1009521484375, -2.02783203125, -1.9547119140625, -1.881591796875, -1.8084716796875, -1.7353515625, -1.6622314453125, -1.589111328125, -1.5159912109375, -1.44287109375, -1.3697509765625, -1.296630859375, -1.2235107421875, -1.150390625, -1.0772705078125, -1.004150390625, -0.9310302734375, -0.85791015625, -0.7847900390625, -0.711669921875, -0.6385498046875, -0.5654296875, -0.4923095703125, -0.419189453125, -0.3460693359375, -0.27294921875, -0.1998291015625, -0.126708984375, -0.0535888671875, 0.01953125, 0.0926513671875, 0.165771484375, 0.2388916015625, 0.31201171875, 0.3851318359375, 0.458251953125, 0.5313720703125, 0.6044921875, 0.6776123046875, 0.750732421875, 0.8238525390625, 0.89697265625, 0.9700927734375, 1.043212890625, 1.1163330078125, 1.189453125, 1.2625732421875, 1.335693359375, 1.4088134765625, 1.48193359375, 1.5550537109375, 1.628173828125, 1.7012939453125, 1.7744140625, 1.8475341796875, 1.920654296875, 1.9937744140625, 2.06689453125, 2.1400146484375, 2.213134765625, 2.2862548828125, 2.359375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 14.0, 32.0, 42.0, 59.0, 84.0, 136.0, 218.0, 319.0, 469.0, 659.0, 1035.0, 1457.0, 2113.0, 3105.0, 4614.0, 7044.0, 10474.0, 16266.0, 25365.0, 41641.0, 72567.0, 143572.0, 1354955.0, 187743.0, 88379.0, 49409.0, 29877.0, 18768.0, 12129.0, 8035.0, 5419.0, 3652.0, 2514.0, 1667.0, 1079.0, 747.0, 473.0, 333.0, 224.0, 136.0, 92.0, 64.0, 54.0, 27.0, 20.0, 20.0, 9.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.63671875, -0.616607666015625, -0.59649658203125, -0.576385498046875, -0.5562744140625, -0.536163330078125, -0.51605224609375, -0.495941162109375, -0.475830078125, -0.455718994140625, -0.43560791015625, -0.415496826171875, -0.3953857421875, -0.375274658203125, -0.35516357421875, -0.335052490234375, -0.31494140625, -0.294830322265625, -0.27471923828125, -0.254608154296875, -0.2344970703125, -0.214385986328125, -0.19427490234375, -0.174163818359375, -0.154052734375, -0.133941650390625, -0.11383056640625, -0.093719482421875, -0.0736083984375, -0.053497314453125, -0.03338623046875, -0.013275146484375, 0.0068359375, 0.026947021484375, 0.04705810546875, 0.067169189453125, 0.0872802734375, 0.107391357421875, 0.12750244140625, 0.147613525390625, 0.167724609375, 0.187835693359375, 0.20794677734375, 0.228057861328125, 0.2481689453125, 0.268280029296875, 0.28839111328125, 0.308502197265625, 0.32861328125, 0.348724365234375, 0.36883544921875, 0.388946533203125, 0.4090576171875, 0.429168701171875, 0.44927978515625, 0.469390869140625, 0.489501953125, 0.509613037109375, 0.52972412109375, 0.549835205078125, 0.5699462890625, 0.590057373046875, 0.61016845703125, 0.630279541015625, 0.650390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 12.0, 7.0, 16.0, 20.0, 24.0, 29.0, 35.0, 37.0, 37.0, 44.0, 50.0, 78.0, 67.0, 68.0, 69.0, 56.0, 48.0, 34.0, 36.0, 37.0, 35.0, 29.0, 20.0, 24.0, 14.0, 8.0, 12.0, 8.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00043845176696777344, -0.0004248395562171936, -0.00041122734546661377, -0.00039761513471603394, -0.0003840029239654541, -0.00037039071321487427, -0.00035677850246429443, -0.0003431662917137146, -0.00032955408096313477, -0.00031594187021255493, -0.0003023296594619751, -0.00028871744871139526, -0.00027510523796081543, -0.0002614930272102356, -0.00024788081645965576, -0.00023426860570907593, -0.0002206563949584961, -0.00020704418420791626, -0.00019343197345733643, -0.0001798197627067566, -0.00016620755195617676, -0.00015259534120559692, -0.0001389831304550171, -0.00012537091970443726, -0.00011175870895385742, -9.814649820327759e-05, -8.453428745269775e-05, -7.092207670211792e-05, -5.7309865951538086e-05, -4.369765520095825e-05, -3.0085444450378418e-05, -1.6473233699798584e-05, -2.86102294921875e-06, 1.0751187801361084e-05, 2.4363398551940918e-05, 3.797560930252075e-05, 5.1587820053100586e-05, 6.520003080368042e-05, 7.881224155426025e-05, 9.242445230484009e-05, 0.00010603666305541992, 0.00011964887380599976, 0.0001332610845565796, 0.00014687329530715942, 0.00016048550605773926, 0.0001740977168083191, 0.00018770992755889893, 0.00020132213830947876, 0.0002149343490600586, 0.00022854655981063843, 0.00024215877056121826, 0.0002557709813117981, 0.00026938319206237793, 0.00028299540281295776, 0.0002966076135635376, 0.00031021982431411743, 0.00032383203506469727, 0.0003374442458152771, 0.00035105645656585693, 0.00036466866731643677, 0.0003782808780670166, 0.00039189308881759644, 0.00040550529956817627, 0.0004191175103187561, 0.00043272972106933594]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 8.0, 5.0, 11.0, 12.0, 9.0, 14.0, 28.0, 31.0, 33.0, 56.0, 67.0, 74.0, 83.0, 124.0, 181.0, 329.0, 524.0, 875.0, 3530.0, 1000709.0, 38818.0, 1150.0, 639.0, 365.0, 235.0, 161.0, 106.0, 91.0, 49.0, 52.0, 52.0, 21.0, 16.0, 23.0, 14.0, 12.0, 7.0, 5.0, 3.0, 5.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00760650634765625, -0.007373809814453125, -0.00714111328125, -0.006908416748046875, -0.00667572021484375, -0.006443023681640625, -0.0062103271484375, -0.005977630615234375, -0.00574493408203125, -0.005512237548828125, -0.005279541015625, -0.005046844482421875, -0.00481414794921875, -0.004581451416015625, -0.0043487548828125, -0.004116058349609375, -0.00388336181640625, -0.003650665283203125, -0.00341796875, -0.003185272216796875, -0.00295257568359375, -0.002719879150390625, -0.0024871826171875, -0.002254486083984375, -0.00202178955078125, -0.001789093017578125, -0.001556396484375, -0.001323699951171875, -0.00109100341796875, -0.000858306884765625, -0.0006256103515625, -0.000392913818359375, -0.00016021728515625, 7.2479248046875e-05, 0.00030517578125, 0.000537872314453125, 0.00077056884765625, 0.001003265380859375, 0.0012359619140625, 0.001468658447265625, 0.00170135498046875, 0.001934051513671875, 0.002166748046875, 0.002399444580078125, 0.00263214111328125, 0.002864837646484375, 0.0030975341796875, 0.003330230712890625, 0.00356292724609375, 0.003795623779296875, 0.0040283203125, 0.004261016845703125, 0.00449371337890625, 0.004726409912109375, 0.0049591064453125, 0.005191802978515625, 0.00542449951171875, 0.005657196044921875, 0.005889892578125, 0.006122589111328125, 0.00635528564453125, 0.006587982177734375, 0.0068206787109375, 0.007053375244140625, 0.00728607177734375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 14.0, 372.0, 565.0, 60.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002532385056838393, -0.0024828817695379257, -0.0024333782494068146, -0.002383874962106347, -0.002334371441975236, -0.0022848681546747684, -0.0022353646345436573, -0.00218586134724319, -0.0021363578271120787, -0.002086854539811611, -0.0020373510196805, -0.0019878477323800325, -0.0019383442122489214, -0.001888840808533132, -0.0018393374048173428, -0.0017898340011015534, -0.0017403305973857641, -0.0016908271936699748, -0.0016413237899541855, -0.0015918203862383962, -0.0015423169825226068, -0.0014928135788068175, -0.0014433101750910282, -0.001393806771375239, -0.0013443034840747714, -0.001294800080358982, -0.0012452966766431928, -0.0011957932729274035, -0.0011462898692116141, -0.0010967864654958248, -0.0010472830617800355, -0.0009977796580642462, -0.0009482763125561178, -0.0008987729088403285, -0.0008492695051245391, -0.0007997661014087498, -0.0007502626976929605, -0.0007007593521848321, -0.0006512559484690428, -0.0006017525447532535, -0.0005522491410374641, -0.0005027457373216748, -0.0004532423336058855, -0.0004037389298900962, -0.00035423552617430687, -0.000304732151562348, -0.0002552287478465587, -0.00020572534413076937, -0.0001562219113111496, -0.00010671850759536028, -5.7215111155528575e-05, -7.711714715696871e-06, 4.179168900009245e-05, 9.129507816396654e-05, 0.00014079848187975585, 0.00019030188559554517, 0.0002398052893113345, 0.0002893086930271238, 0.0003388120967429131, 0.000388315471354872, 0.0004378188750706613, 0.0004873222787864506, 0.0005368256825022399, 0.0005863290862180293, 0.0006358324899338186]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 10.0, 8.0, 7.0, 12.0, 18.0, 13.0, 16.0, 26.0, 18.0, 41.0, 32.0, 35.0, 34.0, 43.0, 40.0, 46.0, 43.0, 41.0, 43.0, 40.0, 44.0, 46.0, 37.0, 50.0, 36.0, 44.0, 31.0, 19.0, 28.0, 9.0, 11.0, 12.0, 12.0, 11.0, 7.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022596120834350586, -0.00021848827600479126, -0.00021101534366607666, -0.00020354241132736206, -0.00019606947898864746, -0.00018859654664993286, -0.00018112361431121826, -0.00017365068197250366, -0.00016617774963378906, -0.00015870481729507446, -0.00015123188495635986, -0.00014375895261764526, -0.00013628602027893066, -0.00012881308794021606, -0.00012134015560150146, -0.00011386722326278687, -0.00010639429092407227, -9.892135858535767e-05, -9.144842624664307e-05, -8.397549390792847e-05, -7.650256156921387e-05, -6.902962923049927e-05, -6.155669689178467e-05, -5.408376455307007e-05, -4.661083221435547e-05, -3.913789987564087e-05, -3.166496753692627e-05, -2.419203519821167e-05, -1.671910285949707e-05, -9.24617052078247e-06, -1.773238182067871e-06, 5.6996941566467285e-06, 1.3172626495361328e-05, 2.0645558834075928e-05, 2.8118491172790527e-05, 3.559142351150513e-05, 4.3064355850219727e-05, 5.0537288188934326e-05, 5.8010220527648926e-05, 6.548315286636353e-05, 7.295608520507812e-05, 8.042901754379272e-05, 8.790194988250732e-05, 9.537488222122192e-05, 0.00010284781455993652, 0.00011032074689865112, 0.00011779367923736572, 0.00012526661157608032, 0.00013273954391479492, 0.00014021247625350952, 0.00014768540859222412, 0.00015515834093093872, 0.00016263127326965332, 0.00017010420560836792, 0.00017757713794708252, 0.00018505007028579712, 0.00019252300262451172, 0.00019999593496322632, 0.00020746886730194092, 0.00021494179964065552, 0.00022241473197937012, 0.00022988766431808472, 0.00023736059665679932, 0.0002448335289955139, 0.0002523064613342285]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 8.0, 19.0, 11.0, 14.0, 15.0, 25.0, 26.0, 22.0, 26.0, 30.0, 29.0, 33.0, 47.0, 41.0, 39.0, 60.0, 47.0, 40.0, 48.0, 39.0, 52.0, 31.0, 40.0, 35.0, 33.0, 33.0, 24.0, 23.0, 21.0, 14.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.0982666015625, -2.973876953125, -2.8494873046875, -2.72509765625, -2.6007080078125, -2.476318359375, -2.3519287109375, -2.2275390625, -2.1031494140625, -1.978759765625, -1.8543701171875, -1.72998046875, -1.6055908203125, -1.481201171875, -1.3568115234375, -1.232421875, -1.1080322265625, -0.983642578125, -0.8592529296875, -0.73486328125, -0.6104736328125, -0.486083984375, -0.3616943359375, -0.2373046875, -0.1129150390625, 0.011474609375, 0.1358642578125, 0.26025390625, 0.3846435546875, 0.509033203125, 0.6334228515625, 0.7578125, 0.8822021484375, 1.006591796875, 1.1309814453125, 1.25537109375, 1.3797607421875, 1.504150390625, 1.6285400390625, 1.7529296875, 1.8773193359375, 2.001708984375, 2.1260986328125, 2.25048828125, 2.3748779296875, 2.499267578125, 2.6236572265625, 2.748046875, 2.8724365234375, 2.996826171875, 3.1212158203125, 3.24560546875, 3.3699951171875, 3.494384765625, 3.6187744140625, 3.7431640625, 3.8675537109375, 3.991943359375, 4.1163330078125, 4.24072265625, 4.3651123046875, 4.489501953125, 4.6138916015625, 4.73828125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 7.0, 9.0, 15.0, 26.0, 32.0, 48.0, 70.0, 95.0, 123.0, 167.0, 237.0, 338.0, 496.0, 739.0, 1094.0, 1665.0, 3382.0, 19995.0, 203257.0, 643476.0, 151008.0, 14445.0, 2866.0, 1548.0, 1069.0, 666.0, 514.0, 339.0, 224.0, 163.0, 140.0, 83.0, 64.0, 41.0, 28.0, 18.0, 14.0, 11.0, 7.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0546875, -8.7666015625, -8.478515625, -8.1904296875, -7.90234375, -7.6142578125, -7.326171875, -7.0380859375, -6.75, -6.4619140625, -6.173828125, -5.8857421875, -5.59765625, -5.3095703125, -5.021484375, -4.7333984375, -4.4453125, -4.1572265625, -3.869140625, -3.5810546875, -3.29296875, -3.0048828125, -2.716796875, -2.4287109375, -2.140625, -1.8525390625, -1.564453125, -1.2763671875, -0.98828125, -0.7001953125, -0.412109375, -0.1240234375, 0.1640625, 0.4521484375, 0.740234375, 1.0283203125, 1.31640625, 1.6044921875, 1.892578125, 2.1806640625, 2.46875, 2.7568359375, 3.044921875, 3.3330078125, 3.62109375, 3.9091796875, 4.197265625, 4.4853515625, 4.7734375, 5.0615234375, 5.349609375, 5.6376953125, 5.92578125, 6.2138671875, 6.501953125, 6.7900390625, 7.078125, 7.3662109375, 7.654296875, 7.9423828125, 8.23046875, 8.5185546875, 8.806640625, 9.0947265625, 9.3828125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 6.0, 3.0, 14.0, 13.0, 25.0, 22.0, 25.0, 31.0, 35.0, 35.0, 49.0, 41.0, 56.0, 99.0, 187.0, 1383.0, 357.0, 166.0, 74.0, 54.0, 45.0, 43.0, 43.0, 33.0, 33.0, 33.0, 18.0, 20.0, 24.0, 16.0, 11.0, 13.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.93359375, -8.625, -8.31640625, -8.0078125, -7.69921875, -7.390625, -7.08203125, -6.7734375, -6.46484375, -6.15625, -5.84765625, -5.5390625, -5.23046875, -4.921875, -4.61328125, -4.3046875, -3.99609375, -3.6875, -3.37890625, -3.0703125, -2.76171875, -2.453125, -2.14453125, -1.8359375, -1.52734375, -1.21875, -0.91015625, -0.6015625, -0.29296875, 0.015625, 0.32421875, 0.6328125, 0.94140625, 1.25, 1.55859375, 1.8671875, 2.17578125, 2.484375, 2.79296875, 3.1015625, 3.41015625, 3.71875, 4.02734375, 4.3359375, 4.64453125, 4.953125, 5.26171875, 5.5703125, 5.87890625, 6.1875, 6.49609375, 6.8046875, 7.11328125, 7.421875, 7.73046875, 8.0390625, 8.34765625, 8.65625, 8.96484375, 9.2734375, 9.58203125, 9.890625, 10.19921875, 10.5078125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 6.0, 13.0, 15.0, 12.0, 13.0, 28.0, 48.0, 39.0, 73.0, 85.0, 124.0, 212.0, 326.0, 503.0, 983.0, 2631.0, 3111534.0, 25656.0, 1534.0, 678.0, 390.0, 252.0, 161.0, 114.0, 70.0, 45.0, 33.0, 31.0, 26.0, 17.0, 12.0, 11.0, 4.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.375, -41.86669921875, -40.3583984375, -38.85009765625, -37.341796875, -35.83349609375, -34.3251953125, -32.81689453125, -31.30859375, -29.80029296875, -28.2919921875, -26.78369140625, -25.275390625, -23.76708984375, -22.2587890625, -20.75048828125, -19.2421875, -17.73388671875, -16.2255859375, -14.71728515625, -13.208984375, -11.70068359375, -10.1923828125, -8.68408203125, -7.17578125, -5.66748046875, -4.1591796875, -2.65087890625, -1.142578125, 0.36572265625, 1.8740234375, 3.38232421875, 4.890625, 6.39892578125, 7.9072265625, 9.41552734375, 10.923828125, 12.43212890625, 13.9404296875, 15.44873046875, 16.95703125, 18.46533203125, 19.9736328125, 21.48193359375, 22.990234375, 24.49853515625, 26.0068359375, 27.51513671875, 29.0234375, 30.53173828125, 32.0400390625, 33.54833984375, 35.056640625, 36.56494140625, 38.0732421875, 39.58154296875, 41.08984375, 42.59814453125, 44.1064453125, 45.61474609375, 47.123046875, 48.63134765625, 50.1396484375, 51.64794921875, 53.15625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 96.0, 623.0, 277.0, 16.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.67234802246094, -92.65572357177734, -89.63909912109375, -86.62247467041016, -83.60585021972656, -80.58922576904297, -77.57260131835938, -74.55597686767578, -71.53935241699219, -68.5227279663086, -65.506103515625, -62.489479064941406, -59.47285461425781, -56.45623016357422, -53.439605712890625, -50.42298126220703, -47.40635681152344, -44.389732360839844, -41.37310791015625, -38.356483459472656, -35.33985900878906, -32.32323455810547, -29.306610107421875, -26.28998565673828, -23.273361206054688, -20.256736755371094, -17.2401123046875, -14.223487854003906, -11.206863403320312, -8.190238952636719, -5.173614501953125, -2.1569900512695312, 0.8596343994140625, 3.8762588500976562, 6.89288330078125, 9.909507751464844, 12.926132202148438, 15.942756652832031, 18.959381103515625, 21.97600555419922, 24.992630004882812, 28.009254455566406, 31.02587890625, 34.042503356933594, 37.05912780761719, 40.07575225830078, 43.092376708984375, 46.10900115966797, 49.12562561035156, 52.142250061035156, 55.15887451171875, 58.175498962402344, 61.19212341308594, 64.20874786376953, 67.22537231445312, 70.24199676513672, 73.25862121582031, 76.2752456665039, 79.2918701171875, 82.3084945678711, 85.32511901855469, 88.34174346923828, 91.35836791992188, 94.37499237060547, 97.39161682128906]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 11.0, 7.0, 8.0, 12.0, 6.0, 13.0, 14.0, 12.0, 15.0, 20.0, 15.0, 22.0, 20.0, 31.0, 34.0, 27.0, 33.0, 38.0, 33.0, 40.0, 38.0, 32.0, 48.0, 37.0, 33.0, 36.0, 32.0, 39.0, 24.0, 28.0, 20.0, 19.0, 20.0, 26.0, 14.0, 20.0, 13.0, 22.0, 15.0, 14.0, 9.0, 13.0, 10.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.73282241821289, -19.054611206054688, -18.376399993896484, -17.69818878173828, -17.01997947692871, -16.341768264770508, -15.663557052612305, -14.985345840454102, -14.307135581970215, -13.628924369812012, -12.950714111328125, -12.272502899169922, -11.594291687011719, -10.916081428527832, -10.237870216369629, -9.559659957885742, -8.881448745727539, -8.203237533569336, -7.525027275085449, -6.846816062927246, -6.168605327606201, -5.490394592285156, -4.812183380126953, -4.133972644805908, -3.4557619094848633, -2.7775511741638184, -2.0993402004241943, -1.4211292266845703, -0.7429184913635254, -0.06470775604248047, 0.6135034561157227, 1.2917141914367676, 1.9699249267578125, 2.6481356620788574, 3.3263466358184814, 4.0045576095581055, 4.68276834487915, 5.360979080200195, 6.039190292358398, 6.717401027679443, 7.395611763000488, 8.073822975158691, 8.752033233642578, 9.430244445800781, 10.108455657958984, 10.786665916442871, 11.464877128601074, 12.143087387084961, 12.821298599243164, 13.499509811401367, 14.177720069885254, 14.855931282043457, 15.534141540527344, 16.212352752685547, 16.89056396484375, 17.568775177001953, 18.246986389160156, 18.92519760131836, 19.603408813476562, 20.281620025634766, 20.959829330444336, 21.63804054260254, 22.316251754760742, 22.994462966918945, 23.672672271728516]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 8.0, 12.0, 10.0, 14.0, 15.0, 26.0, 23.0, 20.0, 16.0, 29.0, 31.0, 44.0, 35.0, 30.0, 37.0, 41.0, 32.0, 41.0, 37.0, 38.0, 61.0, 24.0, 36.0, 37.0, 31.0, 34.0, 35.0, 23.0, 25.0, 20.0, 22.0, 19.0, 8.0, 9.0, 7.0, 6.0, 5.0, 3.0, 8.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.482421875, -3.370849609375, -3.25927734375, -3.147705078125, -3.0361328125, -2.924560546875, -2.81298828125, -2.701416015625, -2.58984375, -2.478271484375, -2.36669921875, -2.255126953125, -2.1435546875, -2.031982421875, -1.92041015625, -1.808837890625, -1.697265625, -1.585693359375, -1.47412109375, -1.362548828125, -1.2509765625, -1.139404296875, -1.02783203125, -0.916259765625, -0.8046875, -0.693115234375, -0.58154296875, -0.469970703125, -0.3583984375, -0.246826171875, -0.13525390625, -0.023681640625, 0.087890625, 0.199462890625, 0.31103515625, 0.422607421875, 0.5341796875, 0.645751953125, 0.75732421875, 0.868896484375, 0.98046875, 1.092041015625, 1.20361328125, 1.315185546875, 1.4267578125, 1.538330078125, 1.64990234375, 1.761474609375, 1.873046875, 1.984619140625, 2.09619140625, 2.207763671875, 2.3193359375, 2.430908203125, 2.54248046875, 2.654052734375, 2.765625, 2.877197265625, 2.98876953125, 3.100341796875, 3.2119140625, 3.323486328125, 3.43505859375, 3.546630859375, 3.658203125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 8.0, 8.0, 14.0, 21.0, 23.0, 36.0, 40.0, 63.0, 70.0, 96.0, 138.0, 218.0, 345.0, 708.0, 1697.0, 4722.0, 20872.0, 132152.0, 822998.0, 2181145.0, 864629.0, 134618.0, 21203.0, 5083.0, 1576.0, 680.0, 356.0, 226.0, 128.0, 99.0, 61.0, 67.0, 33.0, 32.0, 25.0, 25.0, 14.0, 20.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.20233154296875, -4.9984130859375, -4.79449462890625, -4.590576171875, -4.38665771484375, -4.1827392578125, -3.97882080078125, -3.77490234375, -3.57098388671875, -3.3670654296875, -3.16314697265625, -2.959228515625, -2.75531005859375, -2.5513916015625, -2.34747314453125, -2.1435546875, -1.93963623046875, -1.7357177734375, -1.53179931640625, -1.327880859375, -1.12396240234375, -0.9200439453125, -0.71612548828125, -0.51220703125, -0.30828857421875, -0.1043701171875, 0.09954833984375, 0.303466796875, 0.50738525390625, 0.7113037109375, 0.91522216796875, 1.119140625, 1.32305908203125, 1.5269775390625, 1.73089599609375, 1.934814453125, 2.13873291015625, 2.3426513671875, 2.54656982421875, 2.75048828125, 2.95440673828125, 3.1583251953125, 3.36224365234375, 3.566162109375, 3.77008056640625, 3.9739990234375, 4.17791748046875, 4.3818359375, 4.58575439453125, 4.7896728515625, 4.99359130859375, 5.197509765625, 5.40142822265625, 5.6053466796875, 5.80926513671875, 6.01318359375, 6.21710205078125, 6.4210205078125, 6.62493896484375, 6.828857421875, 7.03277587890625, 7.2366943359375, 7.44061279296875, 7.64453125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 9.0, 6.0, 6.0, 8.0, 15.0, 17.0, 28.0, 26.0, 42.0, 60.0, 74.0, 102.0, 139.0, 170.0, 209.0, 304.0, 411.0, 483.0, 467.0, 379.0, 258.0, 201.0, 120.0, 112.0, 104.0, 69.0, 43.0, 37.0, 41.0, 37.0, 25.0, 26.0, 10.0, 8.0, 5.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.18121337890625, -4.9796142578125, -4.77801513671875, -4.576416015625, -4.37481689453125, -4.1732177734375, -3.97161865234375, -3.77001953125, -3.56842041015625, -3.3668212890625, -3.16522216796875, -2.963623046875, -2.76202392578125, -2.5604248046875, -2.35882568359375, -2.1572265625, -1.95562744140625, -1.7540283203125, -1.55242919921875, -1.350830078125, -1.14923095703125, -0.9476318359375, -0.74603271484375, -0.54443359375, -0.34283447265625, -0.1412353515625, 0.06036376953125, 0.261962890625, 0.46356201171875, 0.6651611328125, 0.86676025390625, 1.068359375, 1.26995849609375, 1.4715576171875, 1.67315673828125, 1.874755859375, 2.07635498046875, 2.2779541015625, 2.47955322265625, 2.68115234375, 2.88275146484375, 3.0843505859375, 3.28594970703125, 3.487548828125, 3.68914794921875, 3.8907470703125, 4.09234619140625, 4.2939453125, 4.49554443359375, 4.6971435546875, 4.89874267578125, 5.100341796875, 5.30194091796875, 5.5035400390625, 5.70513916015625, 5.90673828125, 6.10833740234375, 6.3099365234375, 6.51153564453125, 6.713134765625, 6.91473388671875, 7.1163330078125, 7.31793212890625, 7.51953125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 17.0, 29.0, 68.0, 130.0, 218.0, 453.0, 1042.0, 3322.0, 77903.0, 3900632.0, 203974.0, 4366.0, 1177.0, 467.0, 227.0, 114.0, 54.0, 33.0, 15.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.28125, -26.609130859375, -25.93701171875, -25.264892578125, -24.5927734375, -23.920654296875, -23.24853515625, -22.576416015625, -21.904296875, -21.232177734375, -20.56005859375, -19.887939453125, -19.2158203125, -18.543701171875, -17.87158203125, -17.199462890625, -16.52734375, -15.855224609375, -15.18310546875, -14.510986328125, -13.8388671875, -13.166748046875, -12.49462890625, -11.822509765625, -11.150390625, -10.478271484375, -9.80615234375, -9.134033203125, -8.4619140625, -7.789794921875, -7.11767578125, -6.445556640625, -5.7734375, -5.101318359375, -4.42919921875, -3.757080078125, -3.0849609375, -2.412841796875, -1.74072265625, -1.068603515625, -0.396484375, 0.275634765625, 0.94775390625, 1.619873046875, 2.2919921875, 2.964111328125, 3.63623046875, 4.308349609375, 4.98046875, 5.652587890625, 6.32470703125, 6.996826171875, 7.6689453125, 8.341064453125, 9.01318359375, 9.685302734375, 10.357421875, 11.029541015625, 11.70166015625, 12.373779296875, 13.0458984375, 13.718017578125, 14.39013671875, 15.062255859375, 15.734375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 21.0, 670.0, 321.0, 4.0, 1.0, 1.0, 1.0], "bins": [-442.0586853027344, -434.54180908203125, -427.0249328613281, -419.5080871582031, -411.9912109375, -404.4743347167969, -396.95745849609375, -389.44061279296875, -381.9237365722656, -374.4068603515625, -366.8899841308594, -359.3731384277344, -351.85626220703125, -344.3393859863281, -336.822509765625, -329.3056640625, -321.78875732421875, -314.2718811035156, -306.7550048828125, -299.2381591796875, -291.7212829589844, -284.20440673828125, -276.6875305175781, -269.170654296875, -261.65380859375, -254.13693237304688, -246.6200714111328, -239.1031951904297, -231.58633422851562, -224.0694580078125, -216.55258178710938, -209.0357208251953, -201.5188446044922, -194.00196838378906, -186.485107421875, -178.96823120117188, -171.4513702392578, -163.9344940185547, -156.41763305664062, -148.9007568359375, -141.38389587402344, -133.8670196533203, -126.35015869140625, -118.83328247070312, -111.31642150878906, -103.79954528808594, -96.28267669677734, -88.76580810546875, -81.24893188476562, -73.73206329345703, -66.21519470214844, -58.69832229614258, -51.181453704833984, -43.66458511352539, -36.14771270751953, -28.630844116210938, -21.11397933959961, -13.5971097946167, -6.080240249633789, 1.4366302490234375, 8.953498840332031, 16.470367431640625, 23.987239837646484, 31.504108428955078, 39.02097702026367]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 3.0, 4.0, 8.0, 4.0, 8.0, 8.0, 17.0, 12.0, 20.0, 27.0, 18.0, 34.0, 28.0, 19.0, 32.0, 38.0, 36.0, 46.0, 41.0, 40.0, 40.0, 42.0, 45.0, 36.0, 53.0, 36.0, 30.0, 38.0, 33.0, 31.0, 30.0, 25.0, 20.0, 22.0, 9.0, 16.0, 8.0, 12.0, 7.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.018861770629883, -22.141508102416992, -21.264156341552734, -20.386802673339844, -19.509449005126953, -18.632095336914062, -17.754741668701172, -16.877389907836914, -16.000036239624023, -15.122682571411133, -14.245329856872559, -13.367977142333984, -12.490623474121094, -11.613269805908203, -10.735917091369629, -9.858564376831055, -8.981210708618164, -8.103857040405273, -7.226504325866699, -6.349151134490967, -5.471797943115234, -4.594444751739502, -3.7170915603637695, -2.839738368988037, -1.9623851776123047, -1.0850319862365723, -0.20767879486083984, 0.6696743965148926, 1.547027587890625, 2.4243807792663574, 3.30173397064209, 4.179087162017822, 5.056438446044922, 5.933791637420654, 6.811144828796387, 7.688498020172119, 8.565851211547852, 9.443204879760742, 10.320557594299316, 11.19791030883789, 12.075263977050781, 12.952617645263672, 13.829970359802246, 14.70732307434082, 15.584676742553711, 16.4620304107666, 17.33938217163086, 18.21673583984375, 19.09408950805664, 19.97144317626953, 20.848796844482422, 21.72614860534668, 22.60350227355957, 23.48085594177246, 24.35820770263672, 25.23556137084961, 26.1129150390625, 26.99026870727539, 27.86762237548828, 28.74497413635254, 29.62232780456543, 30.49968147277832, 31.377033233642578, 32.25438690185547, 33.13174057006836]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 8.0, 7.0, 22.0, 19.0, 16.0, 17.0, 33.0, 28.0, 44.0, 35.0, 43.0, 44.0, 35.0, 47.0, 37.0, 39.0, 43.0, 46.0, 47.0, 48.0, 41.0, 37.0, 36.0, 31.0, 30.0, 28.0, 24.0, 19.0, 22.0, 9.0, 17.0, 18.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.120361328125, -3.01611328125, -2.911865234375, -2.8076171875, -2.703369140625, -2.59912109375, -2.494873046875, -2.390625, -2.286376953125, -2.18212890625, -2.077880859375, -1.9736328125, -1.869384765625, -1.76513671875, -1.660888671875, -1.556640625, -1.452392578125, -1.34814453125, -1.243896484375, -1.1396484375, -1.035400390625, -0.93115234375, -0.826904296875, -0.72265625, -0.618408203125, -0.51416015625, -0.409912109375, -0.3056640625, -0.201416015625, -0.09716796875, 0.007080078125, 0.111328125, 0.215576171875, 0.31982421875, 0.424072265625, 0.5283203125, 0.632568359375, 0.73681640625, 0.841064453125, 0.9453125, 1.049560546875, 1.15380859375, 1.258056640625, 1.3623046875, 1.466552734375, 1.57080078125, 1.675048828125, 1.779296875, 1.883544921875, 1.98779296875, 2.092041015625, 2.1962890625, 2.300537109375, 2.40478515625, 2.509033203125, 2.61328125, 2.717529296875, 2.82177734375, 2.926025390625, 3.0302734375, 3.134521484375, 3.23876953125, 3.343017578125, 3.447265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 22.0, 22.0, 36.0, 56.0, 81.0, 116.0, 189.0, 295.0, 469.0, 914.0, 1626.0, 2999.0, 5347.0, 10448.0, 20379.0, 39735.0, 81972.0, 197362.0, 377599.0, 164137.0, 71598.0, 34877.0, 17890.0, 9360.0, 4921.0, 2665.0, 1437.0, 830.0, 441.0, 259.0, 153.0, 103.0, 74.0, 43.0, 24.0, 18.0, 18.0, 8.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7568359375, -0.7334823608398438, -0.7101287841796875, -0.6867752075195312, -0.663421630859375, -0.6400680541992188, -0.6167144775390625, -0.5933609008789062, -0.57000732421875, -0.5466537475585938, -0.5233001708984375, -0.49994659423828125, -0.476593017578125, -0.45323944091796875, -0.4298858642578125, -0.40653228759765625, -0.3831787109375, -0.35982513427734375, -0.3364715576171875, -0.31311798095703125, -0.289764404296875, -0.26641082763671875, -0.2430572509765625, -0.21970367431640625, -0.19635009765625, -0.17299652099609375, -0.1496429443359375, -0.12628936767578125, -0.102935791015625, -0.07958221435546875, -0.0562286376953125, -0.03287506103515625, -0.009521484375, 0.01383209228515625, 0.0371856689453125, 0.06053924560546875, 0.083892822265625, 0.10724639892578125, 0.1305999755859375, 0.15395355224609375, 0.17730712890625, 0.20066070556640625, 0.2240142822265625, 0.24736785888671875, 0.270721435546875, 0.29407501220703125, 0.3174285888671875, 0.34078216552734375, 0.3641357421875, 0.38748931884765625, 0.4108428955078125, 0.43419647216796875, 0.457550048828125, 0.48090362548828125, 0.5042572021484375, 0.5276107788085938, 0.55096435546875, 0.5743179321289062, 0.5976715087890625, 0.6210250854492188, 0.644378662109375, 0.6677322387695312, 0.6910858154296875, 0.7144393920898438, 0.73779296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 10.0, 9.0, 4.0, 8.0, 13.0, 12.0, 15.0, 9.0, 23.0, 20.0, 24.0, 28.0, 31.0, 29.0, 27.0, 37.0, 33.0, 34.0, 33.0, 30.0, 43.0, 1061.0, 37.0, 36.0, 39.0, 41.0, 28.0, 30.0, 42.0, 23.0, 31.0, 22.0, 21.0, 20.0, 17.0, 15.0, 24.0, 13.0, 9.0, 8.0, 4.0, 9.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8125, -1.7574005126953125, -1.702301025390625, -1.6472015380859375, -1.59210205078125, -1.5370025634765625, -1.481903076171875, -1.4268035888671875, -1.3717041015625, -1.3166046142578125, -1.261505126953125, -1.2064056396484375, -1.15130615234375, -1.0962066650390625, -1.041107177734375, -0.9860076904296875, -0.930908203125, -0.8758087158203125, -0.820709228515625, -0.7656097412109375, -0.71051025390625, -0.6554107666015625, -0.600311279296875, -0.5452117919921875, -0.4901123046875, -0.4350128173828125, -0.379913330078125, -0.3248138427734375, -0.26971435546875, -0.2146148681640625, -0.159515380859375, -0.1044158935546875, -0.04931640625, 0.0057830810546875, 0.060882568359375, 0.1159820556640625, 0.17108154296875, 0.2261810302734375, 0.281280517578125, 0.3363800048828125, 0.3914794921875, 0.4465789794921875, 0.501678466796875, 0.5567779541015625, 0.61187744140625, 0.6669769287109375, 0.722076416015625, 0.7771759033203125, 0.832275390625, 0.8873748779296875, 0.942474365234375, 0.9975738525390625, 1.05267333984375, 1.1077728271484375, 1.162872314453125, 1.2179718017578125, 1.2730712890625, 1.3281707763671875, 1.383270263671875, 1.4383697509765625, 1.49346923828125, 1.5485687255859375, 1.603668212890625, 1.6587677001953125, 1.7138671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 28.0, 49.0, 65.0, 78.0, 138.0, 161.0, 286.0, 336.0, 520.0, 763.0, 1093.0, 1615.0, 2277.0, 3334.0, 4879.0, 7418.0, 10953.0, 17045.0, 26284.0, 42322.0, 69424.0, 124134.0, 1310190.0, 207712.0, 101709.0, 59334.0, 36393.0, 23016.0, 15004.0, 9754.0, 6582.0, 4515.0, 3013.0, 2109.0, 1421.0, 969.0, 687.0, 488.0, 319.0, 218.0, 157.0, 109.0, 59.0, 42.0, 32.0, 27.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.499755859375, -0.4845390319824219, -0.46932220458984375, -0.4541053771972656, -0.4388885498046875, -0.4236717224121094, -0.40845489501953125, -0.3932380676269531, -0.378021240234375, -0.3628044128417969, -0.34758758544921875, -0.3323707580566406, -0.3171539306640625, -0.3019371032714844, -0.28672027587890625, -0.2715034484863281, -0.25628662109375, -0.24106979370117188, -0.22585296630859375, -0.21063613891601562, -0.1954193115234375, -0.18020248413085938, -0.16498565673828125, -0.14976882934570312, -0.134552001953125, -0.11933517456054688, -0.10411834716796875, -0.08890151977539062, -0.0736846923828125, -0.058467864990234375, -0.04325103759765625, -0.028034210205078125, -0.0128173828125, 0.002399444580078125, 0.01761627197265625, 0.032833099365234375, 0.0480499267578125, 0.06326675415039062, 0.07848358154296875, 0.09370040893554688, 0.108917236328125, 0.12413406372070312, 0.13935089111328125, 0.15456771850585938, 0.1697845458984375, 0.18500137329101562, 0.20021820068359375, 0.21543502807617188, 0.23065185546875, 0.24586868286132812, 0.26108551025390625, 0.2763023376464844, 0.2915191650390625, 0.3067359924316406, 0.32195281982421875, 0.3371696472167969, 0.352386474609375, 0.3676033020019531, 0.38282012939453125, 0.3980369567871094, 0.4132537841796875, 0.4284706115722656, 0.44368743896484375, 0.4589042663574219, 0.47412109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 4.0, 9.0, 11.0, 12.0, 14.0, 11.0, 14.0, 23.0, 27.0, 22.0, 36.0, 42.0, 41.0, 45.0, 51.0, 37.0, 57.0, 57.0, 65.0, 46.0, 57.0, 49.0, 34.0, 35.0, 34.0, 25.0, 23.0, 11.0, 17.0, 14.0, 16.0, 11.0, 9.0, 7.0, 10.0, 2.0, 2.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003428459167480469, -0.00033260881900787354, -0.0003223717212677002, -0.00031213462352752686, -0.0003018975257873535, -0.0002916604280471802, -0.00028142333030700684, -0.0002711862325668335, -0.00026094913482666016, -0.0002507120370864868, -0.00024047493934631348, -0.00023023784160614014, -0.0002200007438659668, -0.00020976364612579346, -0.00019952654838562012, -0.00018928945064544678, -0.00017905235290527344, -0.0001688152551651001, -0.00015857815742492676, -0.00014834105968475342, -0.00013810396194458008, -0.00012786686420440674, -0.0001176297664642334, -0.00010739266872406006, -9.715557098388672e-05, -8.691847324371338e-05, -7.668137550354004e-05, -6.64442777633667e-05, -5.620718002319336e-05, -4.597008228302002e-05, -3.573298454284668e-05, -2.549588680267334e-05, -1.52587890625e-05, -5.02169132232666e-06, 5.21540641784668e-06, 1.545250415802002e-05, 2.568960189819336e-05, 3.59266996383667e-05, 4.616379737854004e-05, 5.640089511871338e-05, 6.663799285888672e-05, 7.687509059906006e-05, 8.71121883392334e-05, 9.734928607940674e-05, 0.00010758638381958008, 0.00011782348155975342, 0.00012806057929992676, 0.0001382976770401001, 0.00014853477478027344, 0.00015877187252044678, 0.00016900897026062012, 0.00017924606800079346, 0.0001894831657409668, 0.00019972026348114014, 0.00020995736122131348, 0.00022019445896148682, 0.00023043155670166016, 0.0002406686544418335, 0.00025090575218200684, 0.0002611428499221802, 0.0002713799476623535, 0.00028161704540252686, 0.0002918541431427002, 0.00030209124088287354, 0.0003123283386230469]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 2.0, 12.0, 11.0, 8.0, 29.0, 32.0, 30.0, 45.0, 53.0, 53.0, 50.0, 128.0, 155.0, 233.0, 327.0, 545.0, 931.0, 8711.0, 1024078.0, 10307.0, 972.0, 542.0, 363.0, 242.0, 175.0, 121.0, 78.0, 62.0, 39.0, 39.0, 26.0, 38.0, 26.0, 11.0, 18.0, 9.0, 11.0, 7.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006000518798828125, -0.005810141563415527, -0.00561976432800293, -0.005429387092590332, -0.005239009857177734, -0.005048632621765137, -0.004858255386352539, -0.004667878150939941, -0.004477500915527344, -0.004287123680114746, -0.0040967464447021484, -0.003906369209289551, -0.003715991973876953, -0.0035256147384643555, -0.003335237503051758, -0.00314486026763916, -0.0029544830322265625, -0.002764105796813965, -0.002573728561401367, -0.0023833513259887695, -0.002192974090576172, -0.0020025968551635742, -0.0018122196197509766, -0.001621842384338379, -0.0014314651489257812, -0.0012410879135131836, -0.001050710678100586, -0.0008603334426879883, -0.0006699562072753906, -0.00047957897186279297, -0.0002892017364501953, -9.882450103759766e-05, 9.1552734375e-05, 0.00028192996978759766, 0.0004723072052001953, 0.000662684440612793, 0.0008530616760253906, 0.0010434389114379883, 0.001233816146850586, 0.0014241933822631836, 0.0016145706176757812, 0.001804947853088379, 0.0019953250885009766, 0.0021857023239135742, 0.002376079559326172, 0.0025664567947387695, 0.002756834030151367, 0.002947211265563965, 0.0031375885009765625, 0.00332796573638916, 0.003518342971801758, 0.0037087202072143555, 0.003899097442626953, 0.004089474678039551, 0.0042798519134521484, 0.004470229148864746, 0.004660606384277344, 0.004850983619689941, 0.005041360855102539, 0.005231738090515137, 0.005422115325927734, 0.005612492561340332, 0.00580286979675293, 0.005993247032165527, 0.006183624267578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 22.0, 178.0, 537.0, 247.0, 28.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006031366647221148, -0.0005752437864430249, -0.0005473509663715959, -0.0005194580880925059, -0.0004915652680210769, -0.000463672389741987, -0.0004357795405667275, -0.00040788669139146805, -0.0003799938422162086, -0.0003521009930409491, -0.00032420814386568964, -0.00029631529469043016, -0.00026842241641134024, -0.000240529581787996, -0.0002126367180608213, -0.00018474386888556182, -0.00015685101971030235, -0.00012895817053504288, -0.0001010653140838258, -7.317245763260871e-05, -4.527960845734924e-05, -1.738675928208977e-05, 1.050610444508493e-05, 3.83989536203444e-05, 6.629180279560387e-05, 9.418465197086334e-05, 0.0001220775011461228, 0.0001499703648732975, 0.00017786321404855698, 0.00020575606322381645, 0.00023364892695099115, 0.0002615417761262506, 0.000289434683509171, 0.0003173275326844305, 0.00034522038185968995, 0.0003731132601387799, 0.0004010060802102089, 0.0004288989584892988, 0.0004567918076645583, 0.00048468465683981776, 0.0005125774769112468, 0.0005404703551903367, 0.0005683631752617657, 0.0005962560535408556, 0.0006241488736122847, 0.0006520417518913746, 0.0006799346301704645, 0.0007078274502418935, 0.0007357203285209835, 0.0007636132068000734, 0.0007915060268715024, 0.0008193989051505923, 0.0008472917252220213, 0.0008751846035011113, 0.0009030774235725403, 0.0009309703018516302, 0.0009588631801307201, 0.00098675605840981, 0.0010146489366889, 0.001042541698552668, 0.001070434576831758, 0.001098327455110848, 0.0011262203333899379, 0.001154113095253706, 0.001182005973532796]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 10.0, 5.0, 10.0, 11.0, 8.0, 12.0, 12.0, 24.0, 20.0, 32.0, 20.0, 29.0, 30.0, 28.0, 44.0, 31.0, 32.0, 41.0, 38.0, 44.0, 36.0, 40.0, 34.0, 37.0, 40.0, 48.0, 29.0, 29.0, 37.0, 26.0, 23.0, 21.0, 21.0, 12.0, 8.0, 14.0, 13.0, 14.0, 7.0, 9.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020492076873779297, -0.0001990925520658493, -0.00019326433539390564, -0.00018743611872196198, -0.0001816079020500183, -0.00017577968537807465, -0.00016995146870613098, -0.00016412325203418732, -0.00015829503536224365, -0.0001524668186903, -0.00014663860201835632, -0.00014081038534641266, -0.000134982168674469, -0.00012915395200252533, -0.00012332573533058167, -0.000117497518658638, -0.00011166930198669434, -0.00010584108531475067, -0.00010001286864280701, -9.418465197086334e-05, -8.835643529891968e-05, -8.252821862697601e-05, -7.670000195503235e-05, -7.087178528308868e-05, -6.504356861114502e-05, -5.9215351939201355e-05, -5.338713526725769e-05, -4.7558918595314026e-05, -4.173070192337036e-05, -3.59024852514267e-05, -3.0074268579483032e-05, -2.4246051907539368e-05, -1.8417835235595703e-05, -1.2589618563652039e-05, -6.761401891708374e-06, -9.331852197647095e-07, 4.895031452178955e-06, 1.072324812412262e-05, 1.6551464796066284e-05, 2.237968146800995e-05, 2.8207898139953613e-05, 3.403611481189728e-05, 3.986433148384094e-05, 4.569254815578461e-05, 5.152076482772827e-05, 5.7348981499671936e-05, 6.31771981716156e-05, 6.900541484355927e-05, 7.483363151550293e-05, 8.06618481874466e-05, 8.649006485939026e-05, 9.231828153133392e-05, 9.814649820327759e-05, 0.00010397471487522125, 0.00010980293154716492, 0.00011563114821910858, 0.00012145936489105225, 0.0001272875815629959, 0.00013311579823493958, 0.00013894401490688324, 0.0001447722315788269, 0.00015060044825077057, 0.00015642866492271423, 0.0001622568815946579, 0.00016808509826660156]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 8.0, 7.0, 22.0, 19.0, 16.0, 17.0, 33.0, 28.0, 44.0, 35.0, 43.0, 44.0, 35.0, 47.0, 37.0, 39.0, 43.0, 46.0, 47.0, 48.0, 41.0, 37.0, 36.0, 31.0, 30.0, 28.0, 24.0, 19.0, 22.0, 9.0, 17.0, 18.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.120361328125, -3.01611328125, -2.911865234375, -2.8076171875, -2.703369140625, -2.59912109375, -2.494873046875, -2.390625, -2.286376953125, -2.18212890625, -2.077880859375, -1.9736328125, -1.869384765625, -1.76513671875, -1.660888671875, -1.556640625, -1.452392578125, -1.34814453125, -1.243896484375, -1.1396484375, -1.035400390625, -0.93115234375, -0.826904296875, -0.72265625, -0.618408203125, -0.51416015625, -0.409912109375, -0.3056640625, -0.201416015625, -0.09716796875, 0.007080078125, 0.111328125, 0.215576171875, 0.31982421875, 0.424072265625, 0.5283203125, 0.632568359375, 0.73681640625, 0.841064453125, 0.9453125, 1.049560546875, 1.15380859375, 1.258056640625, 1.3623046875, 1.466552734375, 1.57080078125, 1.675048828125, 1.779296875, 1.883544921875, 1.98779296875, 2.092041015625, 2.1962890625, 2.300537109375, 2.40478515625, 2.509033203125, 2.61328125, 2.717529296875, 2.82177734375, 2.926025390625, 3.0302734375, 3.134521484375, 3.23876953125, 3.343017578125, 3.447265625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 10.0, 17.0, 18.0, 29.0, 45.0, 63.0, 97.0, 143.0, 173.0, 244.0, 349.0, 455.0, 707.0, 893.0, 1383.0, 2008.0, 3137.0, 5821.0, 27725.0, 362120.0, 577609.0, 47385.0, 7361.0, 3504.0, 2227.0, 1514.0, 993.0, 747.0, 506.0, 356.0, 276.0, 184.0, 154.0, 82.0, 72.0, 42.0, 34.0, 24.0, 15.0, 11.0, 0.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.75, -8.4857177734375, -8.221435546875, -7.9571533203125, -7.69287109375, -7.4285888671875, -7.164306640625, -6.9000244140625, -6.6357421875, -6.3714599609375, -6.107177734375, -5.8428955078125, -5.57861328125, -5.3143310546875, -5.050048828125, -4.7857666015625, -4.521484375, -4.2572021484375, -3.992919921875, -3.7286376953125, -3.46435546875, -3.2000732421875, -2.935791015625, -2.6715087890625, -2.4072265625, -2.1429443359375, -1.878662109375, -1.6143798828125, -1.35009765625, -1.0858154296875, -0.821533203125, -0.5572509765625, -0.29296875, -0.0286865234375, 0.235595703125, 0.4998779296875, 0.76416015625, 1.0284423828125, 1.292724609375, 1.5570068359375, 1.8212890625, 2.0855712890625, 2.349853515625, 2.6141357421875, 2.87841796875, 3.1427001953125, 3.406982421875, 3.6712646484375, 3.935546875, 4.1998291015625, 4.464111328125, 4.7283935546875, 4.99267578125, 5.2569580078125, 5.521240234375, 5.7855224609375, 6.0498046875, 6.3140869140625, 6.578369140625, 6.8426513671875, 7.10693359375, 7.3712158203125, 7.635498046875, 7.8997802734375, 8.1640625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 6.0, 9.0, 18.0, 16.0, 16.0, 31.0, 39.0, 30.0, 40.0, 56.0, 59.0, 73.0, 151.0, 1556.0, 408.0, 143.0, 59.0, 51.0, 51.0, 35.0, 34.0, 32.0, 21.0, 22.0, 17.0, 12.0, 8.0, 7.0, 7.0, 7.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.8170166015625, -9.509033203125, -9.2010498046875, -8.89306640625, -8.5850830078125, -8.277099609375, -7.9691162109375, -7.6611328125, -7.3531494140625, -7.045166015625, -6.7371826171875, -6.42919921875, -6.1212158203125, -5.813232421875, -5.5052490234375, -5.197265625, -4.8892822265625, -4.581298828125, -4.2733154296875, -3.96533203125, -3.6573486328125, -3.349365234375, -3.0413818359375, -2.7333984375, -2.4254150390625, -2.117431640625, -1.8094482421875, -1.50146484375, -1.1934814453125, -0.885498046875, -0.5775146484375, -0.26953125, 0.0384521484375, 0.346435546875, 0.6544189453125, 0.96240234375, 1.2703857421875, 1.578369140625, 1.8863525390625, 2.1943359375, 2.5023193359375, 2.810302734375, 3.1182861328125, 3.42626953125, 3.7342529296875, 4.042236328125, 4.3502197265625, 4.658203125, 4.9661865234375, 5.274169921875, 5.5821533203125, 5.89013671875, 6.1981201171875, 6.506103515625, 6.8140869140625, 7.1220703125, 7.4300537109375, 7.738037109375, 8.0460205078125, 8.35400390625, 8.6619873046875, 8.969970703125, 9.2779541015625, 9.5859375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 8.0, 3.0, 10.0, 16.0, 11.0, 29.0, 24.0, 51.0, 97.0, 129.0, 211.0, 361.0, 746.0, 2077.0, 2858284.0, 280134.0, 1874.0, 700.0, 345.0, 222.0, 108.0, 90.0, 42.0, 39.0, 26.0, 22.0, 11.0, 8.0, 4.0, 2.0, 1.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.0625, -41.6708984375, -40.279296875, -38.8876953125, -37.49609375, -36.1044921875, -34.712890625, -33.3212890625, -31.9296875, -30.5380859375, -29.146484375, -27.7548828125, -26.36328125, -24.9716796875, -23.580078125, -22.1884765625, -20.796875, -19.4052734375, -18.013671875, -16.6220703125, -15.23046875, -13.8388671875, -12.447265625, -11.0556640625, -9.6640625, -8.2724609375, -6.880859375, -5.4892578125, -4.09765625, -2.7060546875, -1.314453125, 0.0771484375, 1.46875, 2.8603515625, 4.251953125, 5.6435546875, 7.03515625, 8.4267578125, 9.818359375, 11.2099609375, 12.6015625, 13.9931640625, 15.384765625, 16.7763671875, 18.16796875, 19.5595703125, 20.951171875, 22.3427734375, 23.734375, 25.1259765625, 26.517578125, 27.9091796875, 29.30078125, 30.6923828125, 32.083984375, 33.4755859375, 34.8671875, 36.2587890625, 37.650390625, 39.0419921875, 40.43359375, 41.8251953125, 43.216796875, 44.6083984375, 46.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 181.0, 554.0, 224.0, 31.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.19784545898438, -140.66525268554688, -138.13265991210938, -135.6000518798828, -133.0674591064453, -130.5348663330078, -128.00225830078125, -125.46966552734375, -122.93707275390625, -120.40447998046875, -117.87187957763672, -115.33927917480469, -112.80668640136719, -110.27409362792969, -107.74149322509766, -105.20889282226562, -102.67630004882812, -100.14370727539062, -97.6111068725586, -95.07850646972656, -92.54591369628906, -90.01332092285156, -87.48072052001953, -84.9481201171875, -82.41552734375, -79.8829345703125, -77.35033416748047, -74.81773376464844, -72.28514099121094, -69.75254821777344, -67.2199478149414, -64.68734741210938, -62.15475082397461, -59.622154235839844, -57.08955764770508, -54.55696105957031, -52.02436447143555, -49.49176788330078, -46.959171295166016, -44.42657470703125, -41.893978118896484, -39.36138153076172, -36.82878494262695, -34.29618835449219, -31.763591766357422, -29.230995178222656, -26.69839859008789, -24.165802001953125, -21.63320541381836, -19.100608825683594, -16.568012237548828, -14.035415649414062, -11.502819061279297, -8.970222473144531, -6.437625885009766, -3.905029296875, -1.3724327087402344, 1.1601638793945312, 3.692760467529297, 6.2253570556640625, 8.757953643798828, 11.290550231933594, 13.82314682006836, 16.355743408203125, 18.88833999633789]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 2.0, 7.0, 8.0, 12.0, 11.0, 19.0, 18.0, 19.0, 21.0, 27.0, 31.0, 28.0, 35.0, 28.0, 36.0, 33.0, 41.0, 37.0, 39.0, 48.0, 48.0, 48.0, 51.0, 42.0, 33.0, 36.0, 40.0, 25.0, 27.0, 27.0, 16.0, 12.0, 21.0, 18.0, 8.0, 14.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-30.263473510742188, -29.354202270507812, -28.444929122924805, -27.53565788269043, -26.626384735107422, -25.717113494873047, -24.807842254638672, -23.898571014404297, -22.98929786682129, -22.080026626586914, -21.170753479003906, -20.26148223876953, -19.352210998535156, -18.44293785095215, -17.533666610717773, -16.624393463134766, -15.71512222290039, -14.8058500289917, -13.896577835083008, -12.987306594848633, -12.078034400939941, -11.16876220703125, -10.259490966796875, -9.350218772888184, -8.440946578979492, -7.531674385070801, -6.622402667999268, -5.713130950927734, -4.803858757019043, -3.8945865631103516, -2.9853148460388184, -2.076043128967285, -1.166769027709961, -0.25749707221984863, 0.6517748832702637, 1.561046838760376, 2.4703187942504883, 3.3795909881591797, 4.288862705230713, 5.198134422302246, 6.1074066162109375, 7.016678810119629, 7.925950527191162, 8.835222244262695, 9.744494438171387, 10.653766632080078, 11.563037872314453, 12.472310066223145, 13.381582260131836, 14.290854454040527, 15.200126647949219, 16.109397888183594, 17.01866912841797, 17.927942276000977, 18.83721351623535, 19.74648666381836, 20.655757904052734, 21.56502914428711, 22.474302291870117, 23.383573532104492, 24.2928466796875, 25.202117919921875, 26.11138916015625, 27.020660400390625, 27.929933547973633]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 13.0, 13.0, 13.0, 20.0, 25.0, 17.0, 20.0, 31.0, 28.0, 26.0, 36.0, 32.0, 43.0, 35.0, 37.0, 34.0, 42.0, 45.0, 29.0, 39.0, 24.0, 46.0, 40.0, 38.0, 28.0, 41.0, 29.0, 31.0, 21.0, 18.0, 17.0, 12.0, 20.0, 7.0, 4.0, 6.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.373046875, -3.27398681640625, -3.1749267578125, -3.07586669921875, -2.976806640625, -2.87774658203125, -2.7786865234375, -2.67962646484375, -2.58056640625, -2.48150634765625, -2.3824462890625, -2.28338623046875, -2.184326171875, -2.08526611328125, -1.9862060546875, -1.88714599609375, -1.7880859375, -1.68902587890625, -1.5899658203125, -1.49090576171875, -1.391845703125, -1.29278564453125, -1.1937255859375, -1.09466552734375, -0.99560546875, -0.89654541015625, -0.7974853515625, -0.69842529296875, -0.599365234375, -0.50030517578125, -0.4012451171875, -0.30218505859375, -0.203125, -0.10406494140625, -0.0050048828125, 0.09405517578125, 0.193115234375, 0.29217529296875, 0.3912353515625, 0.49029541015625, 0.58935546875, 0.68841552734375, 0.7874755859375, 0.88653564453125, 0.985595703125, 1.08465576171875, 1.1837158203125, 1.28277587890625, 1.3818359375, 1.48089599609375, 1.5799560546875, 1.67901611328125, 1.778076171875, 1.87713623046875, 1.9761962890625, 2.07525634765625, 2.17431640625, 2.27337646484375, 2.3724365234375, 2.47149658203125, 2.570556640625, 2.66961669921875, 2.7686767578125, 2.86773681640625, 2.966796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 5.0, 13.0, 11.0, 26.0, 17.0, 34.0, 37.0, 31.0, 60.0, 84.0, 130.0, 227.0, 407.0, 961.0, 2310.0, 7732.0, 36116.0, 321894.0, 2139542.0, 1480306.0, 172600.0, 22670.0, 5502.0, 1816.0, 723.0, 380.0, 201.0, 113.0, 78.0, 57.0, 39.0, 30.0, 22.0, 23.0, 19.0, 13.0, 10.0, 7.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.5, -7.2908935546875, -7.081787109375, -6.8726806640625, -6.66357421875, -6.4544677734375, -6.245361328125, -6.0362548828125, -5.8271484375, -5.6180419921875, -5.408935546875, -5.1998291015625, -4.99072265625, -4.7816162109375, -4.572509765625, -4.3634033203125, -4.154296875, -3.9451904296875, -3.736083984375, -3.5269775390625, -3.31787109375, -3.1087646484375, -2.899658203125, -2.6905517578125, -2.4814453125, -2.2723388671875, -2.063232421875, -1.8541259765625, -1.64501953125, -1.4359130859375, -1.226806640625, -1.0177001953125, -0.80859375, -0.5994873046875, -0.390380859375, -0.1812744140625, 0.02783203125, 0.2369384765625, 0.446044921875, 0.6551513671875, 0.8642578125, 1.0733642578125, 1.282470703125, 1.4915771484375, 1.70068359375, 1.9097900390625, 2.118896484375, 2.3280029296875, 2.537109375, 2.7462158203125, 2.955322265625, 3.1644287109375, 3.37353515625, 3.5826416015625, 3.791748046875, 4.0008544921875, 4.2099609375, 4.4190673828125, 4.628173828125, 4.8372802734375, 5.04638671875, 5.2554931640625, 5.464599609375, 5.6737060546875, 5.8828125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 29.0, 72.0, 248.0, 897.0, 1815.0, 740.0, 199.0, 55.0, 16.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.171875, -25.4130859375, -24.654296875, -23.8955078125, -23.13671875, -22.3779296875, -21.619140625, -20.8603515625, -20.1015625, -19.3427734375, -18.583984375, -17.8251953125, -17.06640625, -16.3076171875, -15.548828125, -14.7900390625, -14.03125, -13.2724609375, -12.513671875, -11.7548828125, -10.99609375, -10.2373046875, -9.478515625, -8.7197265625, -7.9609375, -7.2021484375, -6.443359375, -5.6845703125, -4.92578125, -4.1669921875, -3.408203125, -2.6494140625, -1.890625, -1.1318359375, -0.373046875, 0.3857421875, 1.14453125, 1.9033203125, 2.662109375, 3.4208984375, 4.1796875, 4.9384765625, 5.697265625, 6.4560546875, 7.21484375, 7.9736328125, 8.732421875, 9.4912109375, 10.25, 11.0087890625, 11.767578125, 12.5263671875, 13.28515625, 14.0439453125, 14.802734375, 15.5615234375, 16.3203125, 17.0791015625, 17.837890625, 18.5966796875, 19.35546875, 20.1142578125, 20.873046875, 21.6318359375, 22.390625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 7.0, 11.0, 29.0, 52.0, 249.0, 1423.0, 499517.0, 3690395.0, 2057.0, 400.0, 93.0, 25.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -47.82373046875, -46.1787109375, -44.53369140625, -42.888671875, -41.24365234375, -39.5986328125, -37.95361328125, -36.30859375, -34.66357421875, -33.0185546875, -31.37353515625, -29.728515625, -28.08349609375, -26.4384765625, -24.79345703125, -23.1484375, -21.50341796875, -19.8583984375, -18.21337890625, -16.568359375, -14.92333984375, -13.2783203125, -11.63330078125, -9.98828125, -8.34326171875, -6.6982421875, -5.05322265625, -3.408203125, -1.76318359375, -0.1181640625, 1.52685546875, 3.171875, 4.81689453125, 6.4619140625, 8.10693359375, 9.751953125, 11.39697265625, 13.0419921875, 14.68701171875, 16.33203125, 17.97705078125, 19.6220703125, 21.26708984375, 22.912109375, 24.55712890625, 26.2021484375, 27.84716796875, 29.4921875, 31.13720703125, 32.7822265625, 34.42724609375, 36.072265625, 37.71728515625, 39.3623046875, 41.00732421875, 42.65234375, 44.29736328125, 45.9423828125, 47.58740234375, 49.232421875, 50.87744140625, 52.5224609375, 54.16748046875, 55.8125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 31.0, 164.0, 473.0, 279.0, 51.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.59152221679688, -101.88837432861328, -99.18522644042969, -96.4820785522461, -93.7789306640625, -91.0757827758789, -88.37263488769531, -85.66949462890625, -82.96633911132812, -80.26319122314453, -77.56004333496094, -74.85689544677734, -72.15374755859375, -69.45059967041016, -66.74745178222656, -64.0443115234375, -61.341163635253906, -58.63801574707031, -55.93486785888672, -53.231719970703125, -50.52857208251953, -47.82542419433594, -45.12228012084961, -42.419132232666016, -39.71598434448242, -37.01283645629883, -34.309688568115234, -31.606542587280273, -28.90339469909668, -26.200246810913086, -23.497100830078125, -20.79395294189453, -18.090805053710938, -15.387657165527344, -12.684510231018066, -9.981363296508789, -7.278215408325195, -4.575067520141602, -1.8719215393066406, 0.8312263488769531, 3.534374237060547, 6.237521648406982, 8.940669059753418, 11.643815994262695, 14.346963882446289, 17.050111770629883, 19.753257751464844, 22.456405639648438, 25.15955352783203, 27.862701416015625, 30.56584930419922, 33.26899719238281, 35.972145080566406, 38.67529296875, 41.37843704223633, 44.08158493041992, 46.784732818603516, 49.48788070678711, 52.1910285949707, 54.89417266845703, 57.597320556640625, 60.30046844482422, 63.00361633300781, 65.7067642211914, 68.409912109375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 17.0, 10.0, 8.0, 10.0, 14.0, 17.0, 22.0, 14.0, 27.0, 19.0, 29.0, 29.0, 43.0, 37.0, 32.0, 47.0, 40.0, 45.0, 27.0, 49.0, 25.0, 33.0, 38.0, 33.0, 42.0, 28.0, 29.0, 32.0, 22.0, 24.0, 25.0, 25.0, 21.0, 19.0, 11.0, 14.0, 6.0, 7.0, 2.0, 4.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.871299743652344, -25.081384658813477, -24.291467666625977, -23.50155258178711, -22.711637496948242, -21.921722412109375, -21.131805419921875, -20.341890335083008, -19.55197525024414, -18.762060165405273, -17.972143173217773, -17.182228088378906, -16.39231300354004, -15.602396965026855, -14.812480926513672, -14.022565841674805, -13.232648849487305, -12.442732810974121, -11.652817726135254, -10.86290168762207, -10.072986602783203, -9.28307056427002, -8.493154525756836, -7.7032389640808105, -6.913323402404785, -6.12340784072876, -5.333492279052734, -4.543576240539551, -3.7536606788635254, -2.9637451171875, -2.1738290786743164, -1.383913516998291, -0.5939960479736328, 0.19591963291168213, 0.9858353137969971, 1.7757511138916016, 2.565666675567627, 3.3555822372436523, 4.145498275756836, 4.935413837432861, 5.725329399108887, 6.515244960784912, 7.3051605224609375, 8.095076560974121, 8.884992599487305, 9.674907684326172, 10.464823722839355, 11.254739761352539, 12.044654846191406, 12.83457088470459, 13.624485969543457, 14.41440200805664, 15.204317092895508, 15.994233131408691, 16.784149169921875, 17.574064254760742, 18.36397933959961, 19.153894424438477, 19.943811416625977, 20.733726501464844, 21.52364158630371, 22.313556671142578, 23.103473663330078, 23.893388748168945, 24.683305740356445]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 7.0, 10.0, 11.0, 15.0, 18.0, 21.0, 17.0, 15.0, 20.0, 23.0, 21.0, 26.0, 26.0, 38.0, 30.0, 23.0, 40.0, 30.0, 31.0, 36.0, 45.0, 39.0, 38.0, 41.0, 42.0, 27.0, 40.0, 33.0, 28.0, 29.0, 24.0, 21.0, 18.0, 14.0, 23.0, 10.0, 10.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8910675048828125, -1.820220947265625, -1.7493743896484375, -1.67852783203125, -1.6076812744140625, -1.536834716796875, -1.4659881591796875, -1.3951416015625, -1.3242950439453125, -1.253448486328125, -1.1826019287109375, -1.11175537109375, -1.0409088134765625, -0.970062255859375, -0.8992156982421875, -0.828369140625, -0.7575225830078125, -0.686676025390625, -0.6158294677734375, -0.54498291015625, -0.4741363525390625, -0.403289794921875, -0.3324432373046875, -0.2615966796875, -0.1907501220703125, -0.119903564453125, -0.0490570068359375, 0.02178955078125, 0.0926361083984375, 0.163482666015625, 0.2343292236328125, 0.30517578125, 0.3760223388671875, 0.446868896484375, 0.5177154541015625, 0.58856201171875, 0.6594085693359375, 0.730255126953125, 0.8011016845703125, 0.8719482421875, 0.9427947998046875, 1.013641357421875, 1.0844879150390625, 1.15533447265625, 1.2261810302734375, 1.297027587890625, 1.3678741455078125, 1.438720703125, 1.5095672607421875, 1.580413818359375, 1.6512603759765625, 1.72210693359375, 1.7929534912109375, 1.863800048828125, 1.9346466064453125, 2.0054931640625, 2.0763397216796875, 2.147186279296875, 2.2180328369140625, 2.28887939453125, 2.3597259521484375, 2.430572509765625, 2.5014190673828125, 2.572265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 5.0, 8.0, 15.0, 18.0, 21.0, 33.0, 42.0, 58.0, 104.0, 181.0, 254.0, 387.0, 573.0, 906.0, 1395.0, 2247.0, 3391.0, 5445.0, 8370.0, 13051.0, 20726.0, 33074.0, 56067.0, 100223.0, 200746.0, 279901.0, 136057.0, 72586.0, 42062.0, 25483.0, 16397.0, 10226.0, 6570.0, 4330.0, 2733.0, 1741.0, 1100.0, 726.0, 462.0, 288.0, 195.0, 114.0, 80.0, 50.0, 42.0, 31.0, 20.0, 7.0, 6.0, 6.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.401611328125, -0.3873863220214844, -0.37316131591796875, -0.3589363098144531, -0.3447113037109375, -0.3304862976074219, -0.31626129150390625, -0.3020362854003906, -0.287811279296875, -0.2735862731933594, -0.25936126708984375, -0.24513626098632812, -0.2309112548828125, -0.21668624877929688, -0.20246124267578125, -0.18823623657226562, -0.17401123046875, -0.15978622436523438, -0.14556121826171875, -0.13133621215820312, -0.1171112060546875, -0.10288619995117188, -0.08866119384765625, -0.07443618774414062, -0.060211181640625, -0.045986175537109375, -0.03176116943359375, -0.017536163330078125, -0.0033111572265625, 0.010913848876953125, 0.02513885498046875, 0.039363861083984375, 0.0535888671875, 0.06781387329101562, 0.08203887939453125, 0.09626388549804688, 0.1104888916015625, 0.12471389770507812, 0.13893890380859375, 0.15316390991210938, 0.167388916015625, 0.18161392211914062, 0.19583892822265625, 0.21006393432617188, 0.2242889404296875, 0.23851394653320312, 0.25273895263671875, 0.2669639587402344, 0.28118896484375, 0.2954139709472656, 0.30963897705078125, 0.3238639831542969, 0.3380889892578125, 0.3523139953613281, 0.36653900146484375, 0.3807640075683594, 0.394989013671875, 0.4092140197753906, 0.42343902587890625, 0.4376640319824219, 0.4518890380859375, 0.4661140441894531, 0.48033905029296875, 0.4945640563964844, 0.5087890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 2.0, 3.0, 9.0, 7.0, 10.0, 12.0, 15.0, 21.0, 12.0, 13.0, 31.0, 19.0, 22.0, 30.0, 29.0, 41.0, 38.0, 41.0, 48.0, 38.0, 35.0, 1066.0, 40.0, 33.0, 36.0, 47.0, 37.0, 34.0, 32.0, 30.0, 47.0, 13.0, 27.0, 21.0, 20.0, 14.0, 17.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.65826416015625, -1.6065673828125, -1.55487060546875, -1.503173828125, -1.45147705078125, -1.3997802734375, -1.34808349609375, -1.29638671875, -1.24468994140625, -1.1929931640625, -1.14129638671875, -1.089599609375, -1.03790283203125, -0.9862060546875, -0.93450927734375, -0.8828125, -0.83111572265625, -0.7794189453125, -0.72772216796875, -0.676025390625, -0.62432861328125, -0.5726318359375, -0.52093505859375, -0.46923828125, -0.41754150390625, -0.3658447265625, -0.31414794921875, -0.262451171875, -0.21075439453125, -0.1590576171875, -0.10736083984375, -0.0556640625, -0.00396728515625, 0.0477294921875, 0.09942626953125, 0.151123046875, 0.20281982421875, 0.2545166015625, 0.30621337890625, 0.35791015625, 0.40960693359375, 0.4613037109375, 0.51300048828125, 0.564697265625, 0.61639404296875, 0.6680908203125, 0.71978759765625, 0.771484375, 0.82318115234375, 0.8748779296875, 0.92657470703125, 0.978271484375, 1.02996826171875, 1.0816650390625, 1.13336181640625, 1.18505859375, 1.23675537109375, 1.2884521484375, 1.34014892578125, 1.391845703125, 1.44354248046875, 1.4952392578125, 1.54693603515625, 1.5986328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 13.0, 14.0, 17.0, 27.0, 50.0, 74.0, 102.0, 170.0, 233.0, 377.0, 555.0, 820.0, 1297.0, 1940.0, 2870.0, 4491.0, 6925.0, 10835.0, 17182.0, 27605.0, 45995.0, 79319.0, 152250.0, 1350179.0, 174465.0, 87663.0, 49990.0, 29728.0, 18411.0, 11704.0, 7560.0, 4975.0, 3144.0, 2189.0, 1325.0, 908.0, 598.0, 387.0, 243.0, 177.0, 108.0, 91.0, 41.0, 27.0, 25.0, 14.0, 10.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453857421875, -0.4399299621582031, -0.42600250244140625, -0.4120750427246094, -0.3981475830078125, -0.3842201232910156, -0.37029266357421875, -0.3563652038574219, -0.342437744140625, -0.3285102844238281, -0.31458282470703125, -0.3006553649902344, -0.2867279052734375, -0.2728004455566406, -0.25887298583984375, -0.24494552612304688, -0.23101806640625, -0.21709060668945312, -0.20316314697265625, -0.18923568725585938, -0.1753082275390625, -0.16138076782226562, -0.14745330810546875, -0.13352584838867188, -0.119598388671875, -0.10567092895507812, -0.09174346923828125, -0.07781600952148438, -0.0638885498046875, -0.049961090087890625, -0.03603363037109375, -0.022106170654296875, -0.0081787109375, 0.005748748779296875, 0.01967620849609375, 0.033603668212890625, 0.0475311279296875, 0.061458587646484375, 0.07538604736328125, 0.08931350708007812, 0.103240966796875, 0.11716842651367188, 0.13109588623046875, 0.14502334594726562, 0.1589508056640625, 0.17287826538085938, 0.18680572509765625, 0.20073318481445312, 0.21466064453125, 0.22858810424804688, 0.24251556396484375, 0.2564430236816406, 0.2703704833984375, 0.2842979431152344, 0.29822540283203125, 0.3121528625488281, 0.326080322265625, 0.3400077819824219, 0.35393524169921875, 0.3678627014160156, 0.3817901611328125, 0.3957176208496094, 0.40964508056640625, 0.4235725402832031, 0.4375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 4.0, 12.0, 12.0, 14.0, 12.0, 15.0, 19.0, 24.0, 25.0, 34.0, 38.0, 48.0, 46.0, 52.0, 47.0, 62.0, 59.0, 50.0, 52.0, 48.0, 54.0, 37.0, 32.0, 33.0, 28.0, 20.0, 19.0, 23.0, 13.0, 15.0, 5.0, 7.0, 2.0, 2.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00034356117248535156, -0.00033297762274742126, -0.00032239407300949097, -0.00031181052327156067, -0.00030122697353363037, -0.0002906434237957001, -0.0002800598740577698, -0.0002694763243198395, -0.0002588927745819092, -0.0002483092248439789, -0.00023772567510604858, -0.00022714212536811829, -0.000216558575630188, -0.0002059750258922577, -0.0001953914761543274, -0.0001848079264163971, -0.0001742243766784668, -0.0001636408269405365, -0.0001530572772026062, -0.0001424737274646759, -0.0001318901777267456, -0.00012130662798881531, -0.00011072307825088501, -0.00010013952851295471, -8.955597877502441e-05, -7.897242903709412e-05, -6.838887929916382e-05, -5.780532956123352e-05, -4.722177982330322e-05, -3.6638230085372925e-05, -2.6054680347442627e-05, -1.547113060951233e-05, -4.887580871582031e-06, 5.695968866348267e-06, 1.6279518604278564e-05, 2.6863068342208862e-05, 3.744661808013916e-05, 4.803016781806946e-05, 5.8613717555999756e-05, 6.919726729393005e-05, 7.978081703186035e-05, 9.036436676979065e-05, 0.00010094791650772095, 0.00011153146624565125, 0.00012211501598358154, 0.00013269856572151184, 0.00014328211545944214, 0.00015386566519737244, 0.00016444921493530273, 0.00017503276467323303, 0.00018561631441116333, 0.00019619986414909363, 0.00020678341388702393, 0.00021736696362495422, 0.00022795051336288452, 0.00023853406310081482, 0.0002491176128387451, 0.0002597011625766754, 0.0002702847123146057, 0.000280868262052536, 0.0002914518117904663, 0.0003020353615283966, 0.0003126189112663269, 0.0003232024610042572, 0.0003337860107421875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 10.0, 6.0, 6.0, 12.0, 10.0, 17.0, 30.0, 37.0, 62.0, 76.0, 113.0, 159.0, 254.0, 409.0, 831.0, 2641.0, 1037891.0, 3751.0, 911.0, 461.0, 262.0, 174.0, 119.0, 89.0, 45.0, 50.0, 39.0, 23.0, 15.0, 15.0, 11.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00811767578125, -0.007868289947509766, -0.007618904113769531, -0.007369518280029297, -0.0071201324462890625, -0.006870746612548828, -0.006621360778808594, -0.006371974945068359, -0.006122589111328125, -0.005873203277587891, -0.005623817443847656, -0.005374431610107422, -0.0051250457763671875, -0.004875659942626953, -0.004626274108886719, -0.004376888275146484, -0.00412750244140625, -0.0038781166076660156, -0.0036287307739257812, -0.003379344940185547, -0.0031299591064453125, -0.002880573272705078, -0.0026311874389648438, -0.0023818016052246094, -0.002132415771484375, -0.0018830299377441406, -0.0016336441040039062, -0.0013842582702636719, -0.0011348724365234375, -0.0008854866027832031, -0.0006361007690429688, -0.0003867149353027344, -0.0001373291015625, 0.00011205673217773438, 0.00036144256591796875, 0.0006108283996582031, 0.0008602142333984375, 0.0011096000671386719, 0.0013589859008789062, 0.0016083717346191406, 0.001857757568359375, 0.0021071434020996094, 0.0023565292358398438, 0.002605915069580078, 0.0028553009033203125, 0.003104686737060547, 0.0033540725708007812, 0.0036034584045410156, 0.00385284423828125, 0.004102230072021484, 0.004351615905761719, 0.004601001739501953, 0.0048503875732421875, 0.005099773406982422, 0.005349159240722656, 0.005598545074462891, 0.005847930908203125, 0.006097316741943359, 0.006346702575683594, 0.006596088409423828, 0.0068454742431640625, 0.007094860076904297, 0.007344245910644531, 0.007593631744384766, 0.007843017578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 65.0, 553.0, 364.0, 27.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001295246183872223, -0.0012669855495914817, -0.0012387249153107405, -0.0012104642810299993, -0.001182203646749258, -0.0011539431288838387, -0.0011256824946030974, -0.0010974218603223562, -0.001069161226041615, -0.0010409005917608738, -0.0010126399574801326, -0.0009843793231993914, -0.0009561187471263111, -0.0009278581128455698, -0.0008995975367724895, -0.0008713369024917483, -0.0008430762682110071, -0.0008148156339302659, -0.0007865549996495247, -0.0007582944235764444, -0.0007300337892957032, -0.000701773155014962, -0.0006735125789418817, -0.0006452519446611404, -0.0006169913103803992, -0.000588730676099658, -0.0005604700418189168, -0.0005322094657458365, -0.0005039488314650953, -0.00047568819718435407, -0.0004474275920074433, -0.00041916698683053255, -0.0003909062943421304, -0.0003626456600613892, -0.00033438505488447845, -0.0003061244497075677, -0.0002778638154268265, -0.00024960318114608526, -0.0002213425759691745, -0.00019308195624034852, -0.00016482133651152253, -0.00013656071678269655, -0.00010830009705387056, -8.003947732504457e-05, -5.1778857596218586e-05, -2.35182378673926e-05, 4.742381861433387e-06, 3.300300159025937e-05, 6.126362131908536e-05, 8.952424104791135e-05, 0.00011778486077673733, 0.00014604548050556332, 0.0001743061002343893, 0.0002025667199632153, 0.00023082733969204128, 0.00025908794486895204, 0.00028734857914969325, 0.00031560921343043447, 0.0003438698186073452, 0.000372130423784256, 0.0004003910580649972, 0.0004286516923457384, 0.00045691229752264917, 0.0004851729026995599, 0.0005134335369803011]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 12.0, 11.0, 16.0, 12.0, 9.0, 13.0, 25.0, 22.0, 18.0, 26.0, 24.0, 27.0, 44.0, 43.0, 44.0, 40.0, 37.0, 37.0, 46.0, 37.0, 43.0, 52.0, 39.0, 43.0, 25.0, 33.0, 31.0, 25.0, 13.0, 20.0, 23.0, 16.0, 15.0, 12.0, 11.0, 15.0, 10.0, 6.0, 2.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00020182132720947266, -0.00019604898989200592, -0.00019027665257453918, -0.00018450431525707245, -0.0001787319779396057, -0.00017295964062213898, -0.00016718730330467224, -0.0001614149659872055, -0.00015564262866973877, -0.00014987029135227203, -0.0001440979540348053, -0.00013832561671733856, -0.00013255327939987183, -0.0001267809420824051, -0.00012100860476493835, -0.00011523626744747162, -0.00010946393013000488, -0.00010369159281253815, -9.791925549507141e-05, -9.214691817760468e-05, -8.637458086013794e-05, -8.06022435426712e-05, -7.482990622520447e-05, -6.905756890773773e-05, -6.3285231590271e-05, -5.751289427280426e-05, -5.1740556955337524e-05, -4.596821963787079e-05, -4.019588232040405e-05, -3.442354500293732e-05, -2.865120768547058e-05, -2.2878870368003845e-05, -1.710653305053711e-05, -1.1334195733070374e-05, -5.561858415603638e-06, 2.1047890186309814e-07, 5.982816219329834e-06, 1.175515353679657e-05, 1.7527490854263306e-05, 2.329982817173004e-05, 2.9072165489196777e-05, 3.484450280666351e-05, 4.061684012413025e-05, 4.6389177441596985e-05, 5.216151475906372e-05, 5.7933852076530457e-05, 6.370618939399719e-05, 6.947852671146393e-05, 7.525086402893066e-05, 8.10232013463974e-05, 8.679553866386414e-05, 9.256787598133087e-05, 9.834021329879761e-05, 0.00010411255061626434, 0.00010988488793373108, 0.00011565722525119781, 0.00012142956256866455, 0.0001272018998861313, 0.00013297423720359802, 0.00013874657452106476, 0.0001445189118385315, 0.00015029124915599823, 0.00015606358647346497, 0.0001618359237909317, 0.00016760826110839844]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 7.0, 10.0, 11.0, 15.0, 18.0, 21.0, 17.0, 15.0, 20.0, 23.0, 21.0, 26.0, 26.0, 38.0, 30.0, 23.0, 40.0, 30.0, 31.0, 36.0, 45.0, 39.0, 38.0, 41.0, 42.0, 27.0, 40.0, 33.0, 28.0, 29.0, 23.0, 22.0, 18.0, 14.0, 23.0, 10.0, 10.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8910675048828125, -1.820220947265625, -1.7493743896484375, -1.67852783203125, -1.6076812744140625, -1.536834716796875, -1.4659881591796875, -1.3951416015625, -1.3242950439453125, -1.253448486328125, -1.1826019287109375, -1.11175537109375, -1.0409088134765625, -0.970062255859375, -0.8992156982421875, -0.828369140625, -0.7575225830078125, -0.686676025390625, -0.6158294677734375, -0.54498291015625, -0.4741363525390625, -0.403289794921875, -0.3324432373046875, -0.2615966796875, -0.1907501220703125, -0.119903564453125, -0.0490570068359375, 0.02178955078125, 0.0926361083984375, 0.163482666015625, 0.2343292236328125, 0.30517578125, 0.3760223388671875, 0.446868896484375, 0.5177154541015625, 0.58856201171875, 0.6594085693359375, 0.730255126953125, 0.8011016845703125, 0.8719482421875, 0.9427947998046875, 1.013641357421875, 1.0844879150390625, 1.15533447265625, 1.2261810302734375, 1.297027587890625, 1.3678741455078125, 1.438720703125, 1.5095672607421875, 1.580413818359375, 1.6512603759765625, 1.72210693359375, 1.7929534912109375, 1.863800048828125, 1.9346466064453125, 2.0054931640625, 2.0763397216796875, 2.147186279296875, 2.2180328369140625, 2.28887939453125, 2.3597259521484375, 2.430572509765625, 2.5014190673828125, 2.572265625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 15.0, 27.0, 26.0, 44.0, 44.0, 80.0, 91.0, 127.0, 158.0, 229.0, 329.0, 483.0, 742.0, 1207.0, 2095.0, 4212.0, 10528.0, 39074.0, 257153.0, 594055.0, 103101.0, 20357.0, 6787.0, 3014.0, 1612.0, 933.0, 553.0, 402.0, 271.0, 198.0, 149.0, 130.0, 84.0, 61.0, 46.0, 36.0, 20.0, 17.0, 12.0, 6.0, 5.0, 2.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.2557373046875, -4.105224609375, -3.9547119140625, -3.80419921875, -3.6536865234375, -3.503173828125, -3.3526611328125, -3.2021484375, -3.0516357421875, -2.901123046875, -2.7506103515625, -2.60009765625, -2.4495849609375, -2.299072265625, -2.1485595703125, -1.998046875, -1.8475341796875, -1.697021484375, -1.5465087890625, -1.39599609375, -1.2454833984375, -1.094970703125, -0.9444580078125, -0.7939453125, -0.6434326171875, -0.492919921875, -0.3424072265625, -0.19189453125, -0.0413818359375, 0.109130859375, 0.2596435546875, 0.41015625, 0.5606689453125, 0.711181640625, 0.8616943359375, 1.01220703125, 1.1627197265625, 1.313232421875, 1.4637451171875, 1.6142578125, 1.7647705078125, 1.915283203125, 2.0657958984375, 2.21630859375, 2.3668212890625, 2.517333984375, 2.6678466796875, 2.818359375, 2.9688720703125, 3.119384765625, 3.2698974609375, 3.42041015625, 3.5709228515625, 3.721435546875, 3.8719482421875, 4.0224609375, 4.1729736328125, 4.323486328125, 4.4739990234375, 4.62451171875, 4.7750244140625, 4.925537109375, 5.0760498046875, 5.2265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 9.0, 5.0, 13.0, 7.0, 13.0, 16.0, 18.0, 19.0, 33.0, 31.0, 36.0, 57.0, 42.0, 85.0, 158.0, 435.0, 1483.0, 155.0, 83.0, 63.0, 42.0, 44.0, 40.0, 31.0, 24.0, 22.0, 18.0, 12.0, 10.0, 8.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.1064453125, -8.822265625, -8.5380859375, -8.25390625, -7.9697265625, -7.685546875, -7.4013671875, -7.1171875, -6.8330078125, -6.548828125, -6.2646484375, -5.98046875, -5.6962890625, -5.412109375, -5.1279296875, -4.84375, -4.5595703125, -4.275390625, -3.9912109375, -3.70703125, -3.4228515625, -3.138671875, -2.8544921875, -2.5703125, -2.2861328125, -2.001953125, -1.7177734375, -1.43359375, -1.1494140625, -0.865234375, -0.5810546875, -0.296875, -0.0126953125, 0.271484375, 0.5556640625, 0.83984375, 1.1240234375, 1.408203125, 1.6923828125, 1.9765625, 2.2607421875, 2.544921875, 2.8291015625, 3.11328125, 3.3974609375, 3.681640625, 3.9658203125, 4.25, 4.5341796875, 4.818359375, 5.1025390625, 5.38671875, 5.6708984375, 5.955078125, 6.2392578125, 6.5234375, 6.8076171875, 7.091796875, 7.3759765625, 7.66015625, 7.9443359375, 8.228515625, 8.5126953125, 8.796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 5.0, 7.0, 14.0, 19.0, 23.0, 36.0, 36.0, 72.0, 82.0, 102.0, 169.0, 320.0, 570.0, 1422.0, 24516.0, 3110201.0, 5751.0, 1042.0, 414.0, 244.0, 175.0, 115.0, 91.0, 65.0, 48.0, 47.0, 27.0, 14.0, 13.0, 15.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.5625, -18.957763671875, -18.35302734375, -17.748291015625, -17.1435546875, -16.538818359375, -15.93408203125, -15.329345703125, -14.724609375, -14.119873046875, -13.51513671875, -12.910400390625, -12.3056640625, -11.700927734375, -11.09619140625, -10.491455078125, -9.88671875, -9.281982421875, -8.67724609375, -8.072509765625, -7.4677734375, -6.863037109375, -6.25830078125, -5.653564453125, -5.048828125, -4.444091796875, -3.83935546875, -3.234619140625, -2.6298828125, -2.025146484375, -1.42041015625, -0.815673828125, -0.2109375, 0.393798828125, 0.99853515625, 1.603271484375, 2.2080078125, 2.812744140625, 3.41748046875, 4.022216796875, 4.626953125, 5.231689453125, 5.83642578125, 6.441162109375, 7.0458984375, 7.650634765625, 8.25537109375, 8.860107421875, 9.46484375, 10.069580078125, 10.67431640625, 11.279052734375, 11.8837890625, 12.488525390625, 13.09326171875, 13.697998046875, 14.302734375, 14.907470703125, 15.51220703125, 16.116943359375, 16.7216796875, 17.326416015625, 17.93115234375, 18.535888671875, 19.140625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 47.0, 967.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.534912109375, -308.74957275390625, -302.9642333984375, -297.17889404296875, -291.3935546875, -285.60821533203125, -279.8228759765625, -274.0375671386719, -268.2522277832031, -262.4668884277344, -256.6815490722656, -250.89620971679688, -245.1108856201172, -239.32554626464844, -233.5402069091797, -227.75486755371094, -221.9695281982422, -216.18418884277344, -210.3988494873047, -204.613525390625, -198.82818603515625, -193.0428466796875, -187.25750732421875, -181.47216796875, -175.68682861328125, -169.9014892578125, -164.11614990234375, -158.330810546875, -152.5454864501953, -146.76014709472656, -140.9748077392578, -135.18946838378906, -129.40415954589844, -123.61882019042969, -117.83348846435547, -112.04814910888672, -106.2628173828125, -100.47747802734375, -94.692138671875, -88.90679931640625, -83.1214599609375, -77.33612060546875, -71.55078887939453, -65.76544952392578, -59.9801139831543, -54.19477844238281, -48.40943908691406, -42.62410354614258, -36.83877182006836, -31.053436279296875, -25.268098831176758, -19.48276138305664, -13.697425842285156, -7.912090301513672, -2.126750946044922, 3.6585845947265625, 9.443920135498047, 15.229256629943848, 21.01459312438965, 26.799930572509766, 32.58526611328125, 38.370601654052734, 44.155941009521484, 49.94127655029297, 55.72661209106445]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 4.0, 9.0, 4.0, 7.0, 7.0, 7.0, 7.0, 16.0, 13.0, 16.0, 18.0, 15.0, 21.0, 19.0, 30.0, 23.0, 26.0, 24.0, 32.0, 27.0, 42.0, 27.0, 33.0, 34.0, 34.0, 45.0, 36.0, 33.0, 30.0, 28.0, 37.0, 27.0, 27.0, 20.0, 21.0, 26.0, 19.0, 22.0, 13.0, 20.0, 10.0, 15.0, 12.0, 12.0, 10.0, 7.0, 10.0, 10.0, 5.0, 1.0, 6.0, 3.0, 1.0], "bins": [-18.782054901123047, -18.286327362060547, -17.790599822998047, -17.294872283935547, -16.799144744873047, -16.303417205810547, -15.80768871307373, -15.31196117401123, -14.816232681274414, -14.320505142211914, -13.824777603149414, -13.329050064086914, -12.833321571350098, -12.337594032287598, -11.841866493225098, -11.346138954162598, -10.850411415100098, -10.354683876037598, -9.858956336975098, -9.363227844238281, -8.867500305175781, -8.371772766113281, -7.876045227050781, -7.380317687988281, -6.884589672088623, -6.388862133026123, -5.893134117126465, -5.397406578063965, -4.901679039001465, -4.405951023101807, -3.9102234840393066, -3.4144957065582275, -2.918768882751465, -2.4230411052703857, -1.9273134469985962, -1.4315857887268066, -0.9358580112457275, -0.44013023376464844, 0.05559730529785156, 0.5513250827789307, 1.0470528602600098, 1.5427806377410889, 2.038508415222168, 2.534235954284668, 3.029963731765747, 3.525691509246826, 4.021419048309326, 4.517147064208984, 5.012874603271484, 5.508602142333984, 6.004330158233643, 6.500057697296143, 6.995785713195801, 7.491513252258301, 7.987240791320801, 8.4829683303833, 8.978696823120117, 9.474424362182617, 9.970151901245117, 10.465879440307617, 10.961607933044434, 11.457335472106934, 11.953063011169434, 12.448790550231934, 12.944518089294434]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 13.0, 11.0, 11.0, 12.0, 13.0, 11.0, 18.0, 21.0, 19.0, 21.0, 19.0, 26.0, 27.0, 34.0, 32.0, 32.0, 40.0, 23.0, 39.0, 39.0, 38.0, 37.0, 33.0, 38.0, 37.0, 43.0, 38.0, 37.0, 27.0, 37.0, 21.0, 11.0, 18.0, 20.0, 15.0, 16.0, 14.0, 9.0, 9.0, 8.0, 5.0, 2.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.798828125, -2.714263916015625, -2.62969970703125, -2.545135498046875, -2.4605712890625, -2.376007080078125, -2.29144287109375, -2.206878662109375, -2.122314453125, -2.037750244140625, -1.95318603515625, -1.868621826171875, -1.7840576171875, -1.699493408203125, -1.61492919921875, -1.530364990234375, -1.44580078125, -1.361236572265625, -1.27667236328125, -1.192108154296875, -1.1075439453125, -1.022979736328125, -0.93841552734375, -0.853851318359375, -0.769287109375, -0.684722900390625, -0.60015869140625, -0.515594482421875, -0.4310302734375, -0.346466064453125, -0.26190185546875, -0.177337646484375, -0.0927734375, -0.008209228515625, 0.07635498046875, 0.160919189453125, 0.2454833984375, 0.330047607421875, 0.41461181640625, 0.499176025390625, 0.583740234375, 0.668304443359375, 0.75286865234375, 0.837432861328125, 0.9219970703125, 1.006561279296875, 1.09112548828125, 1.175689697265625, 1.26025390625, 1.344818115234375, 1.42938232421875, 1.513946533203125, 1.5985107421875, 1.683074951171875, 1.76763916015625, 1.852203369140625, 1.936767578125, 2.021331787109375, 2.10589599609375, 2.190460205078125, 2.2750244140625, 2.359588623046875, 2.44415283203125, 2.528717041015625, 2.61328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 4.0, 5.0, 4.0, 7.0, 16.0, 6.0, 13.0, 17.0, 19.0, 37.0, 30.0, 49.0, 49.0, 61.0, 77.0, 108.0, 147.0, 146.0, 250.0, 331.0, 467.0, 706.0, 1121.0, 2488.0, 14065.0, 985587.0, 3105949.0, 73612.0, 4378.0, 1508.0, 869.0, 576.0, 410.0, 275.0, 222.0, 161.0, 111.0, 95.0, 61.0, 44.0, 40.0, 32.0, 19.0, 27.0, 20.0, 23.0, 8.0, 7.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.8671875, -13.436767578125, -13.00634765625, -12.575927734375, -12.1455078125, -11.715087890625, -11.28466796875, -10.854248046875, -10.423828125, -9.993408203125, -9.56298828125, -9.132568359375, -8.7021484375, -8.271728515625, -7.84130859375, -7.410888671875, -6.98046875, -6.550048828125, -6.11962890625, -5.689208984375, -5.2587890625, -4.828369140625, -4.39794921875, -3.967529296875, -3.537109375, -3.106689453125, -2.67626953125, -2.245849609375, -1.8154296875, -1.385009765625, -0.95458984375, -0.524169921875, -0.09375, 0.336669921875, 0.76708984375, 1.197509765625, 1.6279296875, 2.058349609375, 2.48876953125, 2.919189453125, 3.349609375, 3.780029296875, 4.21044921875, 4.640869140625, 5.0712890625, 5.501708984375, 5.93212890625, 6.362548828125, 6.79296875, 7.223388671875, 7.65380859375, 8.084228515625, 8.5146484375, 8.945068359375, 9.37548828125, 9.805908203125, 10.236328125, 10.666748046875, 11.09716796875, 11.527587890625, 11.9580078125, 12.388427734375, 12.81884765625, 13.249267578125, 13.6796875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 8.0, 21.0, 12.0, 39.0, 67.0, 114.0, 219.0, 343.0, 519.0, 692.0, 683.0, 498.0, 351.0, 208.0, 119.0, 55.0, 42.0, 33.0, 14.0, 9.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.24932861328125, -6.0181884765625, -5.78704833984375, -5.555908203125, -5.32476806640625, -5.0936279296875, -4.86248779296875, -4.63134765625, -4.40020751953125, -4.1690673828125, -3.93792724609375, -3.706787109375, -3.47564697265625, -3.2445068359375, -3.01336669921875, -2.7822265625, -2.55108642578125, -2.3199462890625, -2.08880615234375, -1.857666015625, -1.62652587890625, -1.3953857421875, -1.16424560546875, -0.93310546875, -0.70196533203125, -0.4708251953125, -0.23968505859375, -0.008544921875, 0.22259521484375, 0.4537353515625, 0.68487548828125, 0.916015625, 1.14715576171875, 1.3782958984375, 1.60943603515625, 1.840576171875, 2.07171630859375, 2.3028564453125, 2.53399658203125, 2.76513671875, 2.99627685546875, 3.2274169921875, 3.45855712890625, 3.689697265625, 3.92083740234375, 4.1519775390625, 4.38311767578125, 4.6142578125, 4.84539794921875, 5.0765380859375, 5.30767822265625, 5.538818359375, 5.76995849609375, 6.0010986328125, 6.23223876953125, 6.46337890625, 6.69451904296875, 6.9256591796875, 7.15679931640625, 7.387939453125, 7.61907958984375, 7.8502197265625, 8.08135986328125, 8.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 33.0, 78.0, 159.0, 337.0, 888.0, 2663.0, 12596.0, 203240.0, 3330440.0, 612939.0, 24824.0, 3969.0, 1261.0, 453.0, 176.0, 90.0, 40.0, 23.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.46893310546875, -9.1956787109375, -8.92242431640625, -8.649169921875, -8.37591552734375, -8.1026611328125, -7.82940673828125, -7.55615234375, -7.28289794921875, -7.0096435546875, -6.73638916015625, -6.463134765625, -6.18988037109375, -5.9166259765625, -5.64337158203125, -5.3701171875, -5.09686279296875, -4.8236083984375, -4.55035400390625, -4.277099609375, -4.00384521484375, -3.7305908203125, -3.45733642578125, -3.18408203125, -2.91082763671875, -2.6375732421875, -2.36431884765625, -2.091064453125, -1.81781005859375, -1.5445556640625, -1.27130126953125, -0.998046875, -0.72479248046875, -0.4515380859375, -0.17828369140625, 0.094970703125, 0.36822509765625, 0.6414794921875, 0.91473388671875, 1.18798828125, 1.46124267578125, 1.7344970703125, 2.00775146484375, 2.281005859375, 2.55426025390625, 2.8275146484375, 3.10076904296875, 3.3740234375, 3.64727783203125, 3.9205322265625, 4.19378662109375, 4.467041015625, 4.74029541015625, 5.0135498046875, 5.28680419921875, 5.56005859375, 5.83331298828125, 6.1065673828125, 6.37982177734375, 6.653076171875, 6.92633056640625, 7.1995849609375, 7.47283935546875, 7.74609375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 4.0, 12.0, 17.0, 20.0, 32.0, 39.0, 47.0, 77.0, 93.0, 81.0, 100.0, 99.0, 84.0, 74.0, 61.0, 55.0, 30.0, 27.0, 20.0, 10.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.791250228881836, -22.712310791015625, -21.63336944580078, -20.55443000793457, -19.475488662719727, -18.396549224853516, -17.317607879638672, -16.23866844177246, -15.159728050231934, -14.080787658691406, -13.001847267150879, -11.922906875610352, -10.84396743774414, -9.765026092529297, -8.686086654663086, -7.607146263122559, -6.528205871582031, -5.449265480041504, -4.370325088500977, -3.2913851737976074, -2.21244478225708, -1.1335043907165527, -0.054564476013183594, 1.0243759155273438, 2.103316307067871, 3.1822566986083984, 4.261197090148926, 5.340137004852295, 6.419077396392822, 7.49801778793335, 8.576957702636719, 9.655898094177246, 10.73483657836914, 11.813776969909668, 12.892717361450195, 13.971656799316406, 15.05059814453125, 16.12953758239746, 17.208477020263672, 18.287418365478516, 19.36635971069336, 20.44529914855957, 21.524240493774414, 22.603179931640625, 23.68212127685547, 24.76106071472168, 25.84000015258789, 26.918941497802734, 27.997880935668945, 29.076820373535156, 30.15576171875, 31.23470115661621, 32.31364059448242, 33.392581939697266, 34.47152328491211, 35.55046081542969, 36.62940216064453, 37.708343505859375, 38.78728103637695, 39.8662223815918, 40.94516372680664, 42.024105072021484, 43.10304260253906, 44.181983947753906, 45.26092529296875]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 3.0, 7.0, 11.0, 14.0, 12.0, 16.0, 11.0, 22.0, 24.0, 24.0, 25.0, 31.0, 34.0, 29.0, 32.0, 42.0, 40.0, 36.0, 33.0, 31.0, 51.0, 31.0, 45.0, 43.0, 29.0, 32.0, 36.0, 32.0, 27.0, 28.0, 19.0, 21.0, 23.0, 14.0, 9.0, 13.0, 12.0, 14.0, 5.0, 4.0, 6.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.31160545349121, -16.7670841217041, -16.222562789916992, -15.678041458129883, -15.133520126342773, -14.588998794555664, -14.044477462768555, -13.499956130981445, -12.955434799194336, -12.410913467407227, -11.866392135620117, -11.321870803833008, -10.777349472045898, -10.232828140258789, -9.68830680847168, -9.14378547668457, -8.599264144897461, -8.054742813110352, -7.510221481323242, -6.965700149536133, -6.421178817749023, -5.876657485961914, -5.332136154174805, -4.787614822387695, -4.243093490600586, -3.6985721588134766, -3.154050827026367, -2.609529495239258, -2.0650081634521484, -1.520486831665039, -0.9759654998779297, -0.4314441680908203, 0.11307525634765625, 0.6575965881347656, 1.202117919921875, 1.7466392517089844, 2.2911605834960938, 2.835681915283203, 3.3802032470703125, 3.924724578857422, 4.469245910644531, 5.013767242431641, 5.55828857421875, 6.102809906005859, 6.647331237792969, 7.191852569580078, 7.7363739013671875, 8.280895233154297, 8.825416564941406, 9.369937896728516, 9.914459228515625, 10.458980560302734, 11.003501892089844, 11.548023223876953, 12.092544555664062, 12.637065887451172, 13.181587219238281, 13.72610855102539, 14.2706298828125, 14.81515121459961, 15.359672546386719, 15.904193878173828, 16.448715209960938, 16.993236541748047, 17.537757873535156]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 14.0, 11.0, 15.0, 18.0, 17.0, 15.0, 14.0, 29.0, 23.0, 33.0, 22.0, 45.0, 36.0, 29.0, 37.0, 45.0, 40.0, 57.0, 40.0, 31.0, 51.0, 58.0, 23.0, 32.0, 34.0, 30.0, 28.0, 19.0, 21.0, 28.0, 11.0, 13.0, 9.0, 7.0, 16.0, 4.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.943603515625, -25.96533203125, -24.987060546875, -24.0087890625, -23.030517578125, -22.05224609375, -21.073974609375, -20.095703125, -19.117431640625, -18.13916015625, -17.160888671875, -16.1826171875, -15.204345703125, -14.22607421875, -13.247802734375, -12.26953125, -11.291259765625, -10.31298828125, -9.334716796875, -8.3564453125, -7.378173828125, -6.39990234375, -5.421630859375, -4.443359375, -3.465087890625, -2.48681640625, -1.508544921875, -0.5302734375, 0.447998046875, 1.42626953125, 2.404541015625, 3.3828125, 4.361083984375, 5.33935546875, 6.317626953125, 7.2958984375, 8.274169921875, 9.25244140625, 10.230712890625, 11.208984375, 12.187255859375, 13.16552734375, 14.143798828125, 15.1220703125, 16.100341796875, 17.07861328125, 18.056884765625, 19.03515625, 20.013427734375, 20.99169921875, 21.969970703125, 22.9482421875, 23.926513671875, 24.90478515625, 25.883056640625, 26.861328125, 27.839599609375, 28.81787109375, 29.796142578125, 30.7744140625, 31.752685546875, 32.73095703125, 33.709228515625, 34.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 8.0, 14.0, 17.0, 28.0, 48.0, 66.0, 110.0, 165.0, 249.0, 463.0, 669.0, 922.0, 1391.0, 2345.0, 3662.0, 5468.0, 8726.0, 14063.0, 23602.0, 40258.0, 73807.0, 147554.0, 302451.0, 200865.0, 96261.0, 50466.0, 28794.0, 17190.0, 10479.0, 6676.0, 4060.0, 2702.0, 1822.0, 1092.0, 715.0, 499.0, 302.0, 179.0, 118.0, 87.0, 63.0, 28.0, 30.0, 23.0, 10.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.6990966796875, -5.519287109375, -5.3394775390625, -5.15966796875, -4.9798583984375, -4.800048828125, -4.6202392578125, -4.4404296875, -4.2606201171875, -4.080810546875, -3.9010009765625, -3.72119140625, -3.5413818359375, -3.361572265625, -3.1817626953125, -3.001953125, -2.8221435546875, -2.642333984375, -2.4625244140625, -2.28271484375, -2.1029052734375, -1.923095703125, -1.7432861328125, -1.5634765625, -1.3836669921875, -1.203857421875, -1.0240478515625, -0.84423828125, -0.6644287109375, -0.484619140625, -0.3048095703125, -0.125, 0.0548095703125, 0.234619140625, 0.4144287109375, 0.59423828125, 0.7740478515625, 0.953857421875, 1.1336669921875, 1.3134765625, 1.4932861328125, 1.673095703125, 1.8529052734375, 2.03271484375, 2.2125244140625, 2.392333984375, 2.5721435546875, 2.751953125, 2.9317626953125, 3.111572265625, 3.2913818359375, 3.47119140625, 3.6510009765625, 3.830810546875, 4.0106201171875, 4.1904296875, 4.3702392578125, 4.550048828125, 4.7298583984375, 4.90966796875, 5.0894775390625, 5.269287109375, 5.4490966796875, 5.62890625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 6.0, 4.0, 12.0, 17.0, 18.0, 21.0, 16.0, 22.0, 29.0, 29.0, 29.0, 34.0, 39.0, 34.0, 46.0, 33.0, 48.0, 1068.0, 49.0, 40.0, 43.0, 36.0, 43.0, 28.0, 34.0, 36.0, 29.0, 19.0, 25.0, 22.0, 17.0, 17.0, 13.0, 9.0, 6.0, 5.0, 7.0, 6.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.34375, -20.691650390625, -20.03955078125, -19.387451171875, -18.7353515625, -18.083251953125, -17.43115234375, -16.779052734375, -16.126953125, -15.474853515625, -14.82275390625, -14.170654296875, -13.5185546875, -12.866455078125, -12.21435546875, -11.562255859375, -10.91015625, -10.258056640625, -9.60595703125, -8.953857421875, -8.3017578125, -7.649658203125, -6.99755859375, -6.345458984375, -5.693359375, -5.041259765625, -4.38916015625, -3.737060546875, -3.0849609375, -2.432861328125, -1.78076171875, -1.128662109375, -0.4765625, 0.175537109375, 0.82763671875, 1.479736328125, 2.1318359375, 2.783935546875, 3.43603515625, 4.088134765625, 4.740234375, 5.392333984375, 6.04443359375, 6.696533203125, 7.3486328125, 8.000732421875, 8.65283203125, 9.304931640625, 9.95703125, 10.609130859375, 11.26123046875, 11.913330078125, 12.5654296875, 13.217529296875, 13.86962890625, 14.521728515625, 15.173828125, 15.825927734375, 16.47802734375, 17.130126953125, 17.7822265625, 18.434326171875, 19.08642578125, 19.738525390625, 20.390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 16.0, 23.0, 35.0, 49.0, 55.0, 99.0, 162.0, 217.0, 321.0, 508.0, 687.0, 1065.0, 1579.0, 2322.0, 3660.0, 5395.0, 8166.0, 12834.0, 20597.0, 33534.0, 56769.0, 105535.0, 227770.0, 1324464.0, 123657.0, 66084.0, 37531.0, 22742.0, 14414.0, 9000.0, 5921.0, 3851.0, 2562.0, 1796.0, 1213.0, 833.0, 537.0, 368.0, 249.0, 176.0, 112.0, 69.0, 49.0, 29.0, 25.0, 18.0, 5.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.78094482421875, -5.6009521484375, -5.42095947265625, -5.240966796875, -5.06097412109375, -4.8809814453125, -4.70098876953125, -4.52099609375, -4.34100341796875, -4.1610107421875, -3.98101806640625, -3.801025390625, -3.62103271484375, -3.4410400390625, -3.26104736328125, -3.0810546875, -2.90106201171875, -2.7210693359375, -2.54107666015625, -2.361083984375, -2.18109130859375, -2.0010986328125, -1.82110595703125, -1.64111328125, -1.46112060546875, -1.2811279296875, -1.10113525390625, -0.921142578125, -0.74114990234375, -0.5611572265625, -0.38116455078125, -0.201171875, -0.02117919921875, 0.1588134765625, 0.33880615234375, 0.518798828125, 0.69879150390625, 0.8787841796875, 1.05877685546875, 1.23876953125, 1.41876220703125, 1.5987548828125, 1.77874755859375, 1.958740234375, 2.13873291015625, 2.3187255859375, 2.49871826171875, 2.6787109375, 2.85870361328125, 3.0386962890625, 3.21868896484375, 3.398681640625, 3.57867431640625, 3.7586669921875, 3.93865966796875, 4.11865234375, 4.29864501953125, 4.4786376953125, 4.65863037109375, 4.838623046875, 5.01861572265625, 5.1986083984375, 5.37860107421875, 5.55859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 17.0, 16.0, 26.0, 19.0, 35.0, 36.0, 45.0, 53.0, 52.0, 55.0, 64.0, 79.0, 77.0, 71.0, 51.0, 49.0, 42.0, 42.0, 27.0, 23.0, 21.0, 9.0, 12.0, 16.0, 10.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00528717041015625, -0.005140960216522217, -0.004994750022888184, -0.00484853982925415, -0.004702329635620117, -0.004556119441986084, -0.004409909248352051, -0.004263699054718018, -0.004117488861083984, -0.003971278667449951, -0.003825068473815918, -0.0036788582801818848, -0.0035326480865478516, -0.0033864378929138184, -0.003240227699279785, -0.003094017505645752, -0.0029478073120117188, -0.0028015971183776855, -0.0026553869247436523, -0.002509176731109619, -0.002362966537475586, -0.0022167563438415527, -0.0020705461502075195, -0.0019243359565734863, -0.0017781257629394531, -0.00163191556930542, -0.0014857053756713867, -0.0013394951820373535, -0.0011932849884033203, -0.0010470747947692871, -0.0009008646011352539, -0.0007546544075012207, -0.0006084442138671875, -0.0004622340202331543, -0.0003160238265991211, -0.0001698136329650879, -2.3603439331054688e-05, 0.00012260675430297852, 0.0002688169479370117, 0.0004150271415710449, 0.0005612373352050781, 0.0007074475288391113, 0.0008536577224731445, 0.0009998679161071777, 0.001146078109741211, 0.0012922883033752441, 0.0014384984970092773, 0.0015847086906433105, 0.0017309188842773438, 0.001877129077911377, 0.00202333927154541, 0.0021695494651794434, 0.0023157596588134766, 0.0024619698524475098, 0.002608180046081543, 0.002754390239715576, 0.0029006004333496094, 0.0030468106269836426, 0.0031930208206176758, 0.003339231014251709, 0.003485441207885742, 0.0036316514015197754, 0.0037778615951538086, 0.003924071788787842, 0.004070281982421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 15.0, 14.0, 16.0, 22.0, 23.0, 31.0, 54.0, 72.0, 91.0, 126.0, 171.0, 321.0, 482.0, 872.0, 1811.0, 4464.0, 14140.0, 55196.0, 235312.0, 466138.0, 201889.0, 47090.0, 12188.0, 4105.0, 1719.0, 794.0, 490.0, 279.0, 197.0, 116.0, 91.0, 60.0, 41.0, 34.0, 18.0, 16.0, 16.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0227508544921875, -0.021978139877319336, -0.021205425262451172, -0.020432710647583008, -0.019659996032714844, -0.01888728141784668, -0.018114566802978516, -0.01734185218811035, -0.016569137573242188, -0.015796422958374023, -0.01502370834350586, -0.014250993728637695, -0.013478279113769531, -0.012705564498901367, -0.011932849884033203, -0.011160135269165039, -0.010387420654296875, -0.009614706039428711, -0.008841991424560547, -0.008069276809692383, -0.007296562194824219, -0.006523847579956055, -0.005751132965087891, -0.0049784183502197266, -0.0042057037353515625, -0.0034329891204833984, -0.0026602745056152344, -0.0018875598907470703, -0.0011148452758789062, -0.0003421306610107422, 0.0004305839538574219, 0.001203298568725586, 0.00197601318359375, 0.002748727798461914, 0.003521442413330078, 0.004294157028198242, 0.005066871643066406, 0.00583958625793457, 0.006612300872802734, 0.0073850154876708984, 0.008157730102539062, 0.008930444717407227, 0.00970315933227539, 0.010475873947143555, 0.011248588562011719, 0.012021303176879883, 0.012794017791748047, 0.013566732406616211, 0.014339447021484375, 0.015112161636352539, 0.015884876251220703, 0.016657590866088867, 0.01743030548095703, 0.018203020095825195, 0.01897573471069336, 0.019748449325561523, 0.020521163940429688, 0.02129387855529785, 0.022066593170166016, 0.02283930778503418, 0.023612022399902344, 0.024384737014770508, 0.025157451629638672, 0.025930166244506836, 0.026702880859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 11.0, 11.0, 19.0, 32.0, 48.0, 68.0, 94.0, 100.0, 120.0, 101.0, 109.0, 78.0, 64.0, 34.0, 40.0, 29.0, 21.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.005841652862727642, -0.00570902181789279, -0.005576390773057938, -0.005443759728223085, -0.005311128683388233, -0.005178498104214668, -0.005045866593718529, -0.004913236014544964, -0.004780604969710112, -0.004647973924875259, -0.004515342880040407, -0.004382711835205555, -0.004250080790370703, -0.0041174497455358505, -0.003984819166362286, -0.0038521878886967897, -0.0037195568438619375, -0.0035869257990270853, -0.003454294754192233, -0.0033216639421880245, -0.0031890328973531723, -0.00305640185251832, -0.002923770807683468, -0.0027911397628486156, -0.0026585087180137634, -0.002525877673178911, -0.002393246628344059, -0.0022606155835092068, -0.002127984771504998, -0.001995353726670146, -0.0018627226818352938, -0.0017300916370004416, -0.0015974610578268766, -0.0014648300129920244, -0.001332199084572494, -0.0011995680397376418, -0.0010669371113181114, -0.0009343060664832592, -0.000801675021648407, -0.0006690440350212157, -0.0005364130483940244, -0.00040378206176683307, -0.0002711510460358113, -0.00013852003030478954, -5.889043677598238e-06, 0.00012674194294959307, 0.0002593729877844453, 0.0003920039744116366, 0.0005246349610388279, 0.0006572659476660192, 0.0007898969342932105, 0.0009225279791280627, 0.0010551589075475931, 0.0011877899523824453, 0.0013204209972172976, 0.0014530520420521498, 0.0015856829704716802, 0.0017183140153065324, 0.0018509449437260628, 0.001983575988560915, 0.002116207033395767, 0.0022488380782306194, 0.0023814691230654716, 0.00251409993506968, 0.0026467309799045324]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 2.0, 9.0, 6.0, 9.0, 13.0, 16.0, 13.0, 24.0, 21.0, 23.0, 29.0, 29.0, 36.0, 23.0, 42.0, 51.0, 36.0, 40.0, 34.0, 28.0, 28.0, 42.0, 38.0, 40.0, 39.0, 31.0, 31.0, 29.0, 22.0, 36.0, 32.0, 19.0, 23.0, 14.0, 15.0, 14.0, 11.0, 13.0, 9.0, 8.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.002259373664855957, -0.002196243032813072, -0.0021331124007701874, -0.0020699817687273026, -0.0020068511366844177, -0.001943720504641533, -0.001880589872598648, -0.0018174592405557632, -0.0017543286085128784, -0.0016911979764699936, -0.0016280673444271088, -0.001564936712384224, -0.0015018060803413391, -0.0014386754482984543, -0.0013755448162555695, -0.0013124141842126846, -0.0012492835521697998, -0.001186152920126915, -0.0011230222880840302, -0.0010598916560411453, -0.0009967610239982605, -0.0009336303919553757, -0.0008704997599124908, -0.000807369127869606, -0.0007442384958267212, -0.0006811078637838364, -0.0006179772317409515, -0.0005548465996980667, -0.0004917159676551819, -0.00042858533561229706, -0.00036545470356941223, -0.0003023240715265274, -0.00023919343948364258, -0.00017606280744075775, -0.00011293217539787292, -4.98015433549881e-05, 1.3329088687896729e-05, 7.645972073078156e-05, 0.00013959035277366638, 0.0002027209848165512, 0.00026585161685943604, 0.00032898224890232086, 0.0003921128809452057, 0.0004552435129880905, 0.0005183741450309753, 0.0005815047770738602, 0.000644635409116745, 0.0007077660411596298, 0.0007708966732025146, 0.0008340273052453995, 0.0008971579372882843, 0.0009602885693311691, 0.001023419201374054, 0.0010865498334169388, 0.0011496804654598236, 0.0012128110975027084, 0.0012759417295455933, 0.001339072361588478, 0.001402202993631363, 0.0014653336256742477, 0.0015284642577171326, 0.0015915948897600174, 0.0016547255218029022, 0.001717856153845787, 0.0017809867858886719]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 14.0, 11.0, 15.0, 18.0, 17.0, 15.0, 14.0, 29.0, 23.0, 33.0, 22.0, 45.0, 36.0, 29.0, 36.0, 47.0, 39.0, 56.0, 41.0, 31.0, 52.0, 57.0, 23.0, 32.0, 34.0, 30.0, 28.0, 19.0, 21.0, 28.0, 11.0, 13.0, 9.0, 7.0, 16.0, 4.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.943603515625, -25.96533203125, -24.987060546875, -24.0087890625, -23.030517578125, -22.05224609375, -21.073974609375, -20.095703125, -19.117431640625, -18.13916015625, -17.160888671875, -16.1826171875, -15.204345703125, -14.22607421875, -13.247802734375, -12.26953125, -11.291259765625, -10.31298828125, -9.334716796875, -8.3564453125, -7.378173828125, -6.39990234375, -5.421630859375, -4.443359375, -3.465087890625, -2.48681640625, -1.508544921875, -0.5302734375, 0.447998046875, 1.42626953125, 2.404541015625, 3.3828125, 4.361083984375, 5.33935546875, 6.317626953125, 7.2958984375, 8.274169921875, 9.25244140625, 10.230712890625, 11.208984375, 12.187255859375, 13.16552734375, 14.143798828125, 15.1220703125, 16.100341796875, 17.07861328125, 18.056884765625, 19.03515625, 20.013427734375, 20.99169921875, 21.969970703125, 22.9482421875, 23.926513671875, 24.90478515625, 25.883056640625, 26.861328125, 27.839599609375, 28.81787109375, 29.796142578125, 30.7744140625, 31.752685546875, 32.73095703125, 33.709228515625, 34.6875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 5.0, 12.0, 14.0, 17.0, 22.0, 24.0, 34.0, 46.0, 76.0, 91.0, 145.0, 192.0, 310.0, 489.0, 731.0, 1219.0, 2363.0, 4613.0, 11635.0, 36784.0, 143490.0, 445502.0, 290560.0, 74457.0, 20669.0, 7377.0, 3242.0, 1744.0, 948.0, 546.0, 352.0, 269.0, 149.0, 113.0, 84.0, 48.0, 35.0, 38.0, 24.0, 12.0, 13.0, 17.0, 14.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-5.7578125, -5.5872802734375, -5.416748046875, -5.2462158203125, -5.07568359375, -4.9051513671875, -4.734619140625, -4.5640869140625, -4.3935546875, -4.2230224609375, -4.052490234375, -3.8819580078125, -3.71142578125, -3.5408935546875, -3.370361328125, -3.1998291015625, -3.029296875, -2.8587646484375, -2.688232421875, -2.5177001953125, -2.34716796875, -2.1766357421875, -2.006103515625, -1.8355712890625, -1.6650390625, -1.4945068359375, -1.323974609375, -1.1534423828125, -0.98291015625, -0.8123779296875, -0.641845703125, -0.4713134765625, -0.30078125, -0.1302490234375, 0.040283203125, 0.2108154296875, 0.38134765625, 0.5518798828125, 0.722412109375, 0.8929443359375, 1.0634765625, 1.2340087890625, 1.404541015625, 1.5750732421875, 1.74560546875, 1.9161376953125, 2.086669921875, 2.2572021484375, 2.427734375, 2.5982666015625, 2.768798828125, 2.9393310546875, 3.10986328125, 3.2803955078125, 3.450927734375, 3.6214599609375, 3.7919921875, 3.9625244140625, 4.133056640625, 4.3035888671875, 4.47412109375, 4.6446533203125, 4.815185546875, 4.9857177734375, 5.15625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 6.0, 11.0, 14.0, 8.0, 14.0, 23.0, 29.0, 33.0, 52.0, 59.0, 58.0, 79.0, 83.0, 2109.0, 86.0, 59.0, 57.0, 57.0, 44.0, 35.0, 26.0, 25.0, 25.0, 15.0, 10.0, 9.0, 6.0, 13.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.3125, -75.005859375, -72.69921875, -70.392578125, -68.0859375, -65.779296875, -63.47265625, -61.166015625, -58.859375, -56.552734375, -54.24609375, -51.939453125, -49.6328125, -47.326171875, -45.01953125, -42.712890625, -40.40625, -38.099609375, -35.79296875, -33.486328125, -31.1796875, -28.873046875, -26.56640625, -24.259765625, -21.953125, -19.646484375, -17.33984375, -15.033203125, -12.7265625, -10.419921875, -8.11328125, -5.806640625, -3.5, -1.193359375, 1.11328125, 3.419921875, 5.7265625, 8.033203125, 10.33984375, 12.646484375, 14.953125, 17.259765625, 19.56640625, 21.873046875, 24.1796875, 26.486328125, 28.79296875, 31.099609375, 33.40625, 35.712890625, 38.01953125, 40.326171875, 42.6328125, 44.939453125, 47.24609375, 49.552734375, 51.859375, 54.166015625, 56.47265625, 58.779296875, 61.0859375, 63.392578125, 65.69921875, 68.005859375, 70.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 4.0, 8.0, 10.0, 15.0, 24.0, 28.0, 37.0, 42.0, 70.0, 100.0, 112.0, 213.0, 276.0, 383.0, 690.0, 1203.0, 2927.0, 13283.0, 159533.0, 2840473.0, 110032.0, 10586.0, 2629.0, 1151.0, 610.0, 364.0, 275.0, 155.0, 129.0, 95.0, 66.0, 41.0, 35.0, 25.0, 16.0, 20.0, 7.0, 7.0, 6.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.015625, -9.6865234375, -9.357421875, -9.0283203125, -8.69921875, -8.3701171875, -8.041015625, -7.7119140625, -7.3828125, -7.0537109375, -6.724609375, -6.3955078125, -6.06640625, -5.7373046875, -5.408203125, -5.0791015625, -4.75, -4.4208984375, -4.091796875, -3.7626953125, -3.43359375, -3.1044921875, -2.775390625, -2.4462890625, -2.1171875, -1.7880859375, -1.458984375, -1.1298828125, -0.80078125, -0.4716796875, -0.142578125, 0.1865234375, 0.515625, 0.8447265625, 1.173828125, 1.5029296875, 1.83203125, 2.1611328125, 2.490234375, 2.8193359375, 3.1484375, 3.4775390625, 3.806640625, 4.1357421875, 4.46484375, 4.7939453125, 5.123046875, 5.4521484375, 5.78125, 6.1103515625, 6.439453125, 6.7685546875, 7.09765625, 7.4267578125, 7.755859375, 8.0849609375, 8.4140625, 8.7431640625, 9.072265625, 9.4013671875, 9.73046875, 10.0595703125, 10.388671875, 10.7177734375, 11.046875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 14.0, 39.0, 76.0, 174.0, 246.0, 193.0, 118.0, 53.0, 28.0, 10.0, 9.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.93960571289062, -114.4190902709961, -110.89857482910156, -107.37805938720703, -103.8575439453125, -100.33702850341797, -96.81651306152344, -93.2959976196289, -89.77548217773438, -86.25496673583984, -82.73445129394531, -79.21393585205078, -75.69342041015625, -72.17290496826172, -68.65238952636719, -65.13187408447266, -61.611358642578125, -58.090843200683594, -54.57032775878906, -51.04981231689453, -47.529296875, -44.00878143310547, -40.48826599121094, -36.967750549316406, -33.447235107421875, -29.926719665527344, -26.406204223632812, -22.88568878173828, -19.36517333984375, -15.844657897949219, -12.324142456054688, -8.803627014160156, -5.283103942871094, -1.7625885009765625, 1.7579269409179688, 5.2784423828125, 8.798957824707031, 12.319473266601562, 15.839988708496094, 19.360504150390625, 22.881019592285156, 26.401535034179688, 29.92205047607422, 33.44256591796875, 36.96308135986328, 40.48359680175781, 44.004112243652344, 47.524627685546875, 51.045143127441406, 54.56565856933594, 58.08617401123047, 61.606689453125, 65.12720489501953, 68.64772033691406, 72.1682357788086, 75.68875122070312, 79.20926666259766, 82.72978210449219, 86.25029754638672, 89.77081298828125, 93.29132843017578, 96.81184387207031, 100.33235931396484, 103.85287475585938, 107.3733901977539]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 4.0, 12.0, 7.0, 12.0, 21.0, 14.0, 18.0, 30.0, 34.0, 32.0, 23.0, 50.0, 39.0, 38.0, 48.0, 49.0, 59.0, 40.0, 48.0, 55.0, 44.0, 45.0, 41.0, 33.0, 37.0, 36.0, 22.0, 25.0, 21.0, 10.0, 12.0, 6.0, 6.0, 9.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.462646484375, -57.190391540527344, -54.91813659667969, -52.6458854675293, -50.37363052368164, -48.101375579833984, -45.829124450683594, -43.55686950683594, -41.28461456298828, -39.012359619140625, -36.74010467529297, -34.46785354614258, -32.19559860229492, -29.923343658447266, -27.651090621948242, -25.37883758544922, -23.106582641601562, -20.834327697753906, -18.562074661254883, -16.28982162475586, -14.017566680908203, -11.745312690734863, -9.473058700561523, -7.200804710388184, -4.928550720214844, -2.656296730041504, -0.38404273986816406, 1.8882112503051758, 4.160465240478516, 6.4327192306518555, 8.704973220825195, 10.977227210998535, 13.249481201171875, 15.521735191345215, 17.793989181518555, 20.066242218017578, 22.338497161865234, 24.61075210571289, 26.883005142211914, 29.155258178710938, 31.427513122558594, 33.69976806640625, 35.972023010253906, 38.2442741394043, 40.51652908325195, 42.78878402709961, 45.06103515625, 47.333290100097656, 49.60554504394531, 51.87779998779297, 54.150054931640625, 56.422306060791016, 58.69456100463867, 60.96681594848633, 63.23906707763672, 65.51132202148438, 67.78357696533203, 70.05583190917969, 72.32808685302734, 74.600341796875, 76.87258911132812, 79.14484405517578, 81.41709899902344, 83.6893539428711, 85.96160888671875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 11.0, 9.0, 16.0, 17.0, 18.0, 22.0, 40.0, 60.0, 81.0, 132.0, 166.0, 237.0, 369.0, 577.0, 812.0, 1174.0, 1797.0, 2694.0, 3717.0, 5189.0, 1006721.0, 7955.0, 5121.0, 3672.0, 2548.0, 1716.0, 1237.0, 764.0, 517.0, 348.0, 219.0, 173.0, 105.0, 90.0, 51.0, 48.0, 39.0, 21.0, 24.0, 11.0, 4.0, 7.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.675667762756348, -11.31039047241211, -10.945112228393555, -10.579834938049316, -10.214557647705078, -9.849279403686523, -9.484002113342285, -9.118724822998047, -8.753446578979492, -8.388169288635254, -8.0228910446167, -7.657613754272461, -7.2923359870910645, -6.927058219909668, -6.56178092956543, -6.196503162384033, -5.831225395202637, -5.46594762802124, -5.100669860839844, -4.7353925704956055, -4.370114803314209, -4.0048370361328125, -3.639559507369995, -3.2742819786071777, -2.9090042114257812, -2.5437264442443848, -2.1784489154815674, -1.8131712675094604, -1.4478936195373535, -1.0826159715652466, -0.7173383235931396, -0.35206079483032227, 0.013217926025390625, 0.37849557399749756, 0.7437732219696045, 1.1090508699417114, 1.4743285179138184, 1.8396061658859253, 2.2048838138580322, 2.5701613426208496, 2.935439109802246, 3.3007168769836426, 3.66599440574646, 4.031271934509277, 4.396549701690674, 4.76182746887207, 5.127104759216309, 5.492382526397705, 5.857660293579102, 6.222938060760498, 6.5882158279418945, 6.953493118286133, 7.318770885467529, 7.684048652648926, 8.049325942993164, 8.414604187011719, 8.779881477355957, 9.145158767700195, 9.51043701171875, 9.875714302062988, 10.240991592407227, 10.606269836425781, 10.97154712677002, 11.336824417114258, 11.702102661132812]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 10.0, 12.0, 27.0, 52.0, 124.0, 158.0, 10998.0, 51452148.0, 182.0, 66.0, 58.0, 57.0, 31.0, 26.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5163.12060546875, -5030.8798828125, -4898.63916015625, -4766.39794921875, -4634.1572265625, -4501.91650390625, -4369.67578125, -4237.4345703125, -4105.19384765625, -3972.953125, -3840.712158203125, -3708.471435546875, -3576.23046875, -3443.98974609375, -3311.7490234375, -3179.508056640625, -3047.267333984375, -2915.026611328125, -2782.78564453125, -2650.544921875, -2518.303955078125, -2386.063232421875, -2253.822265625, -2121.58154296875, -1989.3406982421875, -1857.099853515625, -1724.8590087890625, -1592.6181640625, -1460.37744140625, -1328.136474609375, -1195.895751953125, -1063.6549072265625, -931.414306640625, -799.1734619140625, -666.9326171875, -534.6918334960938, -402.45098876953125, -270.21014404296875, -137.9693603515625, -5.728515625, 126.5123291015625, 258.753173828125, 390.9939880371094, 523.2348022460938, 655.4756469726562, 787.7164916992188, 919.957275390625, 1052.1981201171875, 1184.43896484375, 1316.6798095703125, 1448.920654296875, 1581.161376953125, 1713.40234375, 1845.64306640625, 1977.8839111328125, 2110.124755859375, 2242.36572265625, 2374.6064453125, 2506.847412109375, 2639.088134765625, 2771.3291015625, 2903.56982421875, 3035.810546875, 3168.051513671875, 3300.292236328125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [8.0, 4.0, 10.0, 15.0, 5.0, 21.0, 39.0, 59.0, 57.0, 110.0, 148.0, 231.0, 354.0, 476.0, 572.0, 768.0, 1119.0, 1700.0, 2510.0, 3661.0, 5277.0, 7544.0, 11175.0, 16182.0, 24880.0, 37421.0, 58824.0, 92086.0, 151729.0, 264004.0, 613418.0, 3900479.0, 481774.0, 233173.0, 137599.0, 84448.0, 54087.0, 34462.0, 22789.0, 14861.0, 10542.0, 6893.0, 4675.0, 3500.0, 2409.0, 1515.0, 1135.0, 811.0, 574.0, 405.0, 303.0, 198.0, 134.0, 80.0, 61.0, 33.0, 29.0, 28.0, 20.0, 11.0, 12.0, 3.0, 1.0, 5.0], "bins": [-2.548828125, -2.4676513671875, -2.386474609375, -2.3052978515625, -2.22412109375, -2.1429443359375, -2.061767578125, -1.9805908203125, -1.8994140625, -1.8182373046875, -1.737060546875, -1.6558837890625, -1.57470703125, -1.4935302734375, -1.412353515625, -1.3311767578125, -1.25, -1.1688232421875, -1.087646484375, -1.0064697265625, -0.92529296875, -0.8441162109375, -0.762939453125, -0.6817626953125, -0.6005859375, -0.5194091796875, -0.438232421875, -0.3570556640625, -0.27587890625, -0.1947021484375, -0.113525390625, -0.0323486328125, 0.048828125, 0.1300048828125, 0.211181640625, 0.2923583984375, 0.37353515625, 0.4547119140625, 0.535888671875, 0.6170654296875, 0.6982421875, 0.7794189453125, 0.860595703125, 0.9417724609375, 1.02294921875, 1.1041259765625, 1.185302734375, 1.2664794921875, 1.34765625, 1.4288330078125, 1.510009765625, 1.5911865234375, 1.67236328125, 1.7535400390625, 1.834716796875, 1.9158935546875, 1.9970703125, 2.0782470703125, 2.159423828125, 2.2406005859375, 2.32177734375, 2.4029541015625, 2.484130859375, 2.5653076171875, 2.646484375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 3.0, 9.0, 9.0, 7.0, 14.0, 14.0, 20.0, 26.0, 29.0, 34.0, 37.0, 34.0, 35.0, 43.0, 40.0, 42.0, 81.0, 366.0, 580.0, 124.0, 53.0, 54.0, 43.0, 38.0, 26.0, 32.0, 34.0, 21.0, 27.0, 29.0, 13.0, 15.0, 18.0, 12.0, 5.0, 7.0, 8.0, 7.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.66534423828125, -6.4439697265625, -6.22259521484375, -6.001220703125, -5.77984619140625, -5.5584716796875, -5.33709716796875, -5.11572265625, -4.89434814453125, -4.6729736328125, -4.45159912109375, -4.230224609375, -4.00885009765625, -3.7874755859375, -3.56610107421875, -3.3447265625, -3.12335205078125, -2.9019775390625, -2.68060302734375, -2.459228515625, -2.23785400390625, -2.0164794921875, -1.79510498046875, -1.57373046875, -1.35235595703125, -1.1309814453125, -0.90960693359375, -0.688232421875, -0.46685791015625, -0.2454833984375, -0.02410888671875, 0.197265625, 0.41864013671875, 0.6400146484375, 0.86138916015625, 1.082763671875, 1.30413818359375, 1.5255126953125, 1.74688720703125, 1.96826171875, 2.18963623046875, 2.4110107421875, 2.63238525390625, 2.853759765625, 3.07513427734375, 3.2965087890625, 3.51788330078125, 3.7392578125, 3.96063232421875, 4.1820068359375, 4.40338134765625, 4.624755859375, 4.84613037109375, 5.0675048828125, 5.28887939453125, 5.51025390625, 5.73162841796875, 5.9530029296875, 6.17437744140625, 6.395751953125, 6.61712646484375, 6.8385009765625, 7.05987548828125, 7.28125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 12.0, 19.0, 14.0, 27.0, 19.0, 33.0, 62.0, 32.0, 71.0, 159.0, 175.0, 219.0, 311.0, 532.0, 678.0, 1058.0, 1566.0, 2353.0, 3170.0, 4743.0, 7200.0, 11652.0, 18402.0, 29579.0, 47705.0, 78133.0, 135718.0, 252716.0, 667276.0, 3942583.0, 540929.0, 228047.0, 123315.0, 72449.0, 44030.0, 27363.0, 16878.0, 10908.0, 6918.0, 4638.0, 3016.0, 2103.0, 1391.0, 976.0, 658.0, 474.0, 339.0, 214.0, 152.0, 103.0, 90.0, 67.0, 49.0, 51.0, 24.0, 0.0, 22.0, 4.0, 4.0, 5.0, 13.0], "bins": [-3.228515625, -3.128936767578125, -3.02935791015625, -2.929779052734375, -2.8302001953125, -2.730621337890625, -2.63104248046875, -2.531463623046875, -2.431884765625, -2.332305908203125, -2.23272705078125, -2.133148193359375, -2.0335693359375, -1.933990478515625, -1.83441162109375, -1.734832763671875, -1.63525390625, -1.535675048828125, -1.43609619140625, -1.336517333984375, -1.2369384765625, -1.137359619140625, -1.03778076171875, -0.938201904296875, -0.838623046875, -0.739044189453125, -0.63946533203125, -0.539886474609375, -0.4403076171875, -0.340728759765625, -0.24114990234375, -0.141571044921875, -0.0419921875, 0.057586669921875, 0.15716552734375, 0.256744384765625, 0.3563232421875, 0.455902099609375, 0.55548095703125, 0.655059814453125, 0.754638671875, 0.854217529296875, 0.95379638671875, 1.053375244140625, 1.1529541015625, 1.252532958984375, 1.35211181640625, 1.451690673828125, 1.55126953125, 1.650848388671875, 1.75042724609375, 1.850006103515625, 1.9495849609375, 2.049163818359375, 2.14874267578125, 2.248321533203125, 2.347900390625, 2.447479248046875, 2.54705810546875, 2.646636962890625, 2.7462158203125, 2.845794677734375, 2.94537353515625, 3.044952392578125, 3.14453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 4.0, 11.0, 5.0, 6.0, 22.0, 13.0, 19.0, 15.0, 27.0, 40.0, 26.0, 30.0, 37.0, 46.0, 46.0, 52.0, 104.0, 354.0, 530.0, 162.0, 70.0, 54.0, 52.0, 44.0, 39.0, 33.0, 23.0, 22.0, 20.0, 28.0, 16.0, 18.0, 12.0, 16.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.44232177734375, -5.2674560546875, -5.09259033203125, -4.917724609375, -4.74285888671875, -4.5679931640625, -4.39312744140625, -4.21826171875, -4.04339599609375, -3.8685302734375, -3.69366455078125, -3.518798828125, -3.34393310546875, -3.1690673828125, -2.99420166015625, -2.8193359375, -2.64447021484375, -2.4696044921875, -2.29473876953125, -2.119873046875, -1.94500732421875, -1.7701416015625, -1.59527587890625, -1.42041015625, -1.24554443359375, -1.0706787109375, -0.89581298828125, -0.720947265625, -0.54608154296875, -0.3712158203125, -0.19635009765625, -0.021484375, 0.15338134765625, 0.3282470703125, 0.50311279296875, 0.677978515625, 0.85284423828125, 1.0277099609375, 1.20257568359375, 1.37744140625, 1.55230712890625, 1.7271728515625, 1.90203857421875, 2.076904296875, 2.25177001953125, 2.4266357421875, 2.60150146484375, 2.7763671875, 2.95123291015625, 3.1260986328125, 3.30096435546875, 3.475830078125, 3.65069580078125, 3.8255615234375, 4.00042724609375, 4.17529296875, 4.35015869140625, 4.5250244140625, 4.69989013671875, 4.874755859375, 5.04962158203125, 5.2244873046875, 5.39935302734375, 5.57421875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 12.0, 6.0, 5.0, 14.0, 27.0, 37.0, 22.0, 33.0, 53.0, 57.0, 55.0, 97.0, 132.0, 117.0, 186.0, 255.0, 349.0, 499.0, 636.0, 806.0, 1258.0, 1856.0, 2673.0, 4456.0, 7543.0, 15317.0, 36407.0, 146945.0, 5910017.0, 99779.0, 29770.0, 12836.0, 6789.0, 3880.0, 2571.0, 1683.0, 1107.0, 821.0, 580.0, 396.0, 344.0, 252.0, 187.0, 131.0, 76.0, 77.0, 59.0, 45.0, 54.0, 46.0, 31.0, 18.0, 10.0, 9.0, 5.0, 8.0, 2.0, 9.0, 0.0, 6.0], "bins": [-9.296875, -9.0098876953125, -8.722900390625, -8.4359130859375, -8.14892578125, -7.8619384765625, -7.574951171875, -7.2879638671875, -7.0009765625, -6.7139892578125, -6.427001953125, -6.1400146484375, -5.85302734375, -5.5660400390625, -5.279052734375, -4.9920654296875, -4.705078125, -4.4180908203125, -4.131103515625, -3.8441162109375, -3.55712890625, -3.2701416015625, -2.983154296875, -2.6961669921875, -2.4091796875, -2.1221923828125, -1.835205078125, -1.5482177734375, -1.26123046875, -0.9742431640625, -0.687255859375, -0.4002685546875, -0.11328125, 0.1737060546875, 0.460693359375, 0.7476806640625, 1.03466796875, 1.3216552734375, 1.608642578125, 1.8956298828125, 2.1826171875, 2.4696044921875, 2.756591796875, 3.0435791015625, 3.33056640625, 3.6175537109375, 3.904541015625, 4.1915283203125, 4.478515625, 4.7655029296875, 5.052490234375, 5.3394775390625, 5.62646484375, 5.9134521484375, 6.200439453125, 6.4874267578125, 6.7744140625, 7.0614013671875, 7.348388671875, 7.6353759765625, 7.92236328125, 8.2093505859375, 8.496337890625, 8.7833251953125, 9.0703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 2.0, 7.0, 9.0, 7.0, 11.0, 12.0, 10.0, 16.0, 15.0, 25.0, 20.0, 28.0, 34.0, 44.0, 41.0, 35.0, 49.0, 68.0, 133.0, 340.0, 415.0, 163.0, 85.0, 69.0, 44.0, 48.0, 36.0, 32.0, 29.0, 41.0, 24.0, 25.0, 13.0, 14.0, 10.0, 11.0, 6.0, 10.0, 8.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.416015625, -3.30609130859375, -3.1961669921875, -3.08624267578125, -2.976318359375, -2.86639404296875, -2.7564697265625, -2.64654541015625, -2.53662109375, -2.42669677734375, -2.3167724609375, -2.20684814453125, -2.096923828125, -1.98699951171875, -1.8770751953125, -1.76715087890625, -1.6572265625, -1.54730224609375, -1.4373779296875, -1.32745361328125, -1.217529296875, -1.10760498046875, -0.9976806640625, -0.88775634765625, -0.77783203125, -0.66790771484375, -0.5579833984375, -0.44805908203125, -0.338134765625, -0.22821044921875, -0.1182861328125, -0.00836181640625, 0.1015625, 0.21148681640625, 0.3214111328125, 0.43133544921875, 0.541259765625, 0.65118408203125, 0.7611083984375, 0.87103271484375, 0.98095703125, 1.09088134765625, 1.2008056640625, 1.31072998046875, 1.420654296875, 1.53057861328125, 1.6405029296875, 1.75042724609375, 1.8603515625, 1.97027587890625, 2.0802001953125, 2.19012451171875, 2.300048828125, 2.40997314453125, 2.5198974609375, 2.62982177734375, 2.73974609375, 2.84967041015625, 2.9595947265625, 3.06951904296875, 3.179443359375, 3.28936767578125, 3.3992919921875, 3.50921630859375, 3.619140625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 38.0, 75.0, 362.0, 398.0, 77.0, 30.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.866183280944824, -13.000533103942871, -12.134882926940918, -11.269231796264648, -10.403581619262695, -9.537931442260742, -8.672281265258789, -7.806630611419678, -6.940980434417725, -6.0753302574157715, -5.20967960357666, -4.344029426574707, -3.478379011154175, -2.6127285957336426, -1.7470784187316895, -0.8814277648925781, -0.015777587890625, 0.8498727679252625, 1.71552312374115, 2.5811734199523926, 3.446823835372925, 4.312474250793457, 5.17812442779541, 6.0437750816345215, 6.909425258636475, 7.775075435638428, 8.640726089477539, 9.506376266479492, 10.372026443481445, 11.237676620483398, 12.103326797485352, 12.968977928161621, 13.834627151489258, 14.700277328491211, 15.565927505493164, 16.431577682495117, 17.29722785949707, 18.162879943847656, 19.02853012084961, 19.894180297851562, 20.759830474853516, 21.62548065185547, 22.491130828857422, 23.356781005859375, 24.222431182861328, 25.08808135986328, 25.953731536865234, 26.81938362121582, 27.68503189086914, 28.550682067871094, 29.416332244873047, 30.281982421875, 31.147632598876953, 32.013282775878906, 32.87893295288086, 33.74458312988281, 34.61023712158203, 35.475887298583984, 36.34153747558594, 37.20718765258789, 38.072837829589844, 38.9384880065918, 39.80413818359375, 40.6697883605957, 41.535438537597656]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 9.0, 5.0, 9.0, 17.0, 12.0, 18.0, 16.0, 25.0, 14.0, 30.0, 39.0, 24.0, 28.0, 43.0, 33.0, 45.0, 22.0, 39.0, 44.0, 47.0, 42.0, 43.0, 35.0, 36.0, 34.0, 32.0, 37.0, 27.0, 28.0, 18.0, 21.0, 24.0, 14.0, 19.0, 11.0, 17.0, 13.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.966644763946533, -4.810634613037109, -4.6546244621276855, -4.498614311218262, -4.342604637145996, -4.186594486236572, -4.030584335327148, -3.8745741844177246, -3.718564033508301, -3.562553882598877, -3.406543731689453, -3.2505338191986084, -3.0945236682891846, -2.9385135173797607, -2.782503604888916, -2.626493453979492, -2.4704833030700684, -2.3144731521606445, -2.1584630012512207, -2.002453088760376, -1.8464429378509521, -1.6904327869415283, -1.534422755241394, -1.3784127235412598, -1.222402572631836, -1.066392421722412, -0.9103823900222778, -0.7543722987174988, -0.5983622074127197, -0.4423521161079407, -0.2863420248031616, -0.13033199310302734, 0.02567768096923828, 0.18168777227401733, 0.3376978635787964, 0.49370795488357544, 0.6497180461883545, 0.8057281374931335, 0.9617382287979126, 1.1177482604980469, 1.2737584114074707, 1.4297685623168945, 1.5857785940170288, 1.741788625717163, 1.897798776626587, 2.0538089275360107, 2.2098188400268555, 2.3658289909362793, 2.521839141845703, 2.677849292755127, 2.833859443664551, 2.9898693561553955, 3.1458795070648193, 3.301889657974243, 3.457899570465088, 3.6139097213745117, 3.7699198722839355, 3.9259300231933594, 4.081940174102783, 4.237950325012207, 4.393959999084473, 4.5499701499938965, 4.70598030090332, 4.861990451812744, 5.018000602722168]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 3.0, 6.0, 9.0, 9.0, 11.0, 20.0, 32.0, 37.0, 31.0, 66.0, 76.0, 102.0, 129.0, 177.0, 288.0, 472.0, 663.0, 1149.0, 1865.0, 3293.0, 6333.0, 14010.0, 38173.0, 189674.0, 3824287.0, 73063.0, 21455.0, 8882.0, 4212.0, 2208.0, 1276.0, 795.0, 514.0, 321.0, 208.0, 119.0, 87.0, 61.0, 57.0, 45.0, 19.0, 13.0, 11.0, 4.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0255584716796875, -0.0248720645904541, -0.024185657501220703, -0.023499250411987305, -0.022812843322753906, -0.022126436233520508, -0.02144002914428711, -0.02075362205505371, -0.020067214965820312, -0.019380807876586914, -0.018694400787353516, -0.018007993698120117, -0.01732158660888672, -0.01663517951965332, -0.015948772430419922, -0.015262365341186523, -0.014575958251953125, -0.013889551162719727, -0.013203144073486328, -0.01251673698425293, -0.011830329895019531, -0.011143922805786133, -0.010457515716552734, -0.009771108627319336, -0.009084701538085938, -0.008398294448852539, -0.007711887359619141, -0.007025480270385742, -0.006339073181152344, -0.005652666091918945, -0.004966259002685547, -0.0042798519134521484, -0.00359344482421875, -0.0029070377349853516, -0.002220630645751953, -0.0015342235565185547, -0.0008478164672851562, -0.0001614093780517578, 0.0005249977111816406, 0.001211404800415039, 0.0018978118896484375, 0.002584218978881836, 0.0032706260681152344, 0.003957033157348633, 0.004643440246582031, 0.00532984733581543, 0.006016254425048828, 0.0067026615142822266, 0.007389068603515625, 0.008075475692749023, 0.008761882781982422, 0.00944828987121582, 0.010134696960449219, 0.010821104049682617, 0.011507511138916016, 0.012193918228149414, 0.012880325317382812, 0.013566732406616211, 0.01425313949584961, 0.014939546585083008, 0.015625953674316406, 0.016312360763549805, 0.016998767852783203, 0.0176851749420166, 0.01837158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 4.0, 8.0, 6.0, 5.0, 10.0, 12.0, 10.0, 11.0, 25.0, 780.0, 16.0, 14.0, 13.0, 9.0, 8.0, 6.0, 8.0, 5.0, 6.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444122314453125, -0.004296720027923584, -0.004149317741394043, -0.004001915454864502, -0.003854513168334961, -0.00370711088180542, -0.003559708595275879, -0.003412306308746338, -0.003264904022216797, -0.003117501735687256, -0.002970099449157715, -0.002822697162628174, -0.002675294876098633, -0.002527892589569092, -0.0023804903030395508, -0.0022330880165100098, -0.0020856857299804688, -0.0019382834434509277, -0.0017908811569213867, -0.0016434788703918457, -0.0014960765838623047, -0.0013486742973327637, -0.0012012720108032227, -0.0010538697242736816, -0.0009064674377441406, -0.0007590651512145996, -0.0006116628646850586, -0.0004642605781555176, -0.00031685829162597656, -0.00016945600509643555, -2.205371856689453e-05, 0.00012534856796264648, 0.0002727508544921875, 0.0004201531410217285, 0.0005675554275512695, 0.0007149577140808105, 0.0008623600006103516, 0.0010097622871398926, 0.0011571645736694336, 0.0013045668601989746, 0.0014519691467285156, 0.0015993714332580566, 0.0017467737197875977, 0.0018941760063171387, 0.0020415782928466797, 0.0021889805793762207, 0.0023363828659057617, 0.0024837851524353027, 0.0026311874389648438, 0.0027785897254943848, 0.0029259920120239258, 0.003073394298553467, 0.003220796585083008, 0.003368198871612549, 0.00351560115814209, 0.003663003444671631, 0.003810405731201172, 0.003957808017730713, 0.004105210304260254, 0.004252612590789795, 0.004400014877319336, 0.004547417163848877, 0.004694819450378418, 0.004842221736907959, 0.0049896240234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 4.0, 9.0, 7.0, 5.0, 18.0, 29.0, 49.0, 91.0, 146.0, 302.0, 786.0, 2859.0, 16661.0, 208067.0, 3694681.0, 247930.0, 18163.0, 2937.0, 807.0, 339.0, 143.0, 91.0, 49.0, 25.0, 18.0, 13.0, 14.0, 5.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.039825439453125, -0.03870439529418945, -0.037583351135253906, -0.03646230697631836, -0.03534126281738281, -0.034220218658447266, -0.03309917449951172, -0.03197813034057617, -0.030857086181640625, -0.029736042022705078, -0.02861499786376953, -0.027493953704833984, -0.026372909545898438, -0.02525186538696289, -0.024130821228027344, -0.023009777069091797, -0.02188873291015625, -0.020767688751220703, -0.019646644592285156, -0.01852560043334961, -0.017404556274414062, -0.016283512115478516, -0.015162467956542969, -0.014041423797607422, -0.012920379638671875, -0.011799335479736328, -0.010678291320800781, -0.009557247161865234, -0.008436203002929688, -0.007315158843994141, -0.006194114685058594, -0.005073070526123047, -0.0039520263671875, -0.002830982208251953, -0.0017099380493164062, -0.0005888938903808594, 0.0005321502685546875, 0.0016531944274902344, 0.0027742385864257812, 0.003895282745361328, 0.005016326904296875, 0.006137371063232422, 0.007258415222167969, 0.008379459381103516, 0.009500503540039062, 0.01062154769897461, 0.011742591857910156, 0.012863636016845703, 0.01398468017578125, 0.015105724334716797, 0.016226768493652344, 0.01734781265258789, 0.018468856811523438, 0.019589900970458984, 0.02071094512939453, 0.021831989288330078, 0.022953033447265625, 0.024074077606201172, 0.02519512176513672, 0.026316165924072266, 0.027437210083007812, 0.02855825424194336, 0.029679298400878906, 0.030800342559814453, 0.03192138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 8.0, 3.0, 12.0, 10.0, 16.0, 22.0, 23.0, 35.0, 62.0, 78.0, 117.0, 166.0, 240.0, 431.0, 820.0, 828.0, 407.0, 256.0, 139.0, 114.0, 74.0, 54.0, 43.0, 39.0, 26.0, 12.0, 17.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00598907470703125, -0.005775034427642822, -0.0055609941482543945, -0.005346953868865967, -0.005132913589477539, -0.004918873310089111, -0.004704833030700684, -0.004490792751312256, -0.004276752471923828, -0.0040627121925354, -0.0038486719131469727, -0.003634631633758545, -0.003420591354370117, -0.0032065510749816895, -0.0029925107955932617, -0.002778470516204834, -0.0025644302368164062, -0.0023503899574279785, -0.0021363496780395508, -0.001922309398651123, -0.0017082691192626953, -0.0014942288398742676, -0.0012801885604858398, -0.0010661482810974121, -0.0008521080017089844, -0.0006380677223205566, -0.0004240274429321289, -0.00020998716354370117, 4.0531158447265625e-06, 0.0002180933952331543, 0.00043213367462158203, 0.0006461739540100098, 0.0008602142333984375, 0.0010742545127868652, 0.001288294792175293, 0.0015023350715637207, 0.0017163753509521484, 0.0019304156303405762, 0.002144455909729004, 0.0023584961891174316, 0.0025725364685058594, 0.002786576747894287, 0.003000617027282715, 0.0032146573066711426, 0.0034286975860595703, 0.003642737865447998, 0.0038567781448364258, 0.0040708184242248535, 0.004284858703613281, 0.004498898983001709, 0.004712939262390137, 0.0049269795417785645, 0.005141019821166992, 0.00535506010055542, 0.005569100379943848, 0.005783140659332275, 0.005997180938720703, 0.006211221218109131, 0.006425261497497559, 0.006639301776885986, 0.006853342056274414, 0.007067382335662842, 0.0072814226150512695, 0.007495462894439697, 0.007709503173828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 15.0, 18.0, 33.0, 60.0, 90.0, 138.0, 154.0, 149.0, 111.0, 96.0, 41.0, 30.0, 22.0, 16.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032929886132478714, -0.031552888453006744, -0.030175894498825073, -0.028798898681998253, -0.027421902865171432, -0.026044907048344612, -0.024667911231517792, -0.02329091541469097, -0.02191391959786415, -0.02053692378103733, -0.01915992796421051, -0.01778293214738369, -0.01640593633055687, -0.01502894051373005, -0.013651944696903229, -0.012274948880076408, -0.010897953063249588, -0.009520957246422768, -0.008143961429595947, -0.006766965612769127, -0.0053899697959423065, -0.004012973979115486, -0.0026359781622886658, -0.0012589823454618454, 0.00011801347136497498, 0.0014950092881917953, 0.0028720051050186157, 0.004249000921845436, 0.0056259967386722565, 0.007002992555499077, 0.008379988372325897, 0.009756984189152718, 0.011133983731269836, 0.012510979548096657, 0.013887975364923477, 0.015264971181750298, 0.016641966998577118, 0.01801896281540394, 0.01939595863223076, 0.02077295444905758, 0.0221499502658844, 0.02352694608271122, 0.02490394189953804, 0.02628093771636486, 0.02765793353319168, 0.0290349293500185, 0.03041192516684532, 0.03178892284631729, 0.03316591680049896, 0.034542910754680634, 0.0359199084341526, 0.03729690611362457, 0.038673900067806244, 0.040050894021987915, 0.041427891701459885, 0.042804889380931854, 0.044181883335113525, 0.0455588772892952, 0.046935874968767166, 0.048312872648239136, 0.04968986660242081, 0.05106686055660248, 0.05244385823607445, 0.05382085591554642, 0.05519784986972809]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 12.0, 15.0, 24.0, 17.0, 29.0, 22.0, 38.0, 35.0, 43.0, 50.0, 46.0, 48.0, 45.0, 60.0, 47.0, 46.0, 57.0, 45.0, 49.0, 29.0, 43.0, 32.0, 30.0, 24.0, 21.0, 17.0, 12.0, 15.0, 11.0, 6.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02670830488204956, -0.02584611438214779, -0.024983923882246017, -0.024121733382344246, -0.023259542882442474, -0.022397352382540703, -0.02153516188263893, -0.02067297138273716, -0.019810780882835388, -0.018948590382933617, -0.018086399883031845, -0.017224209383130074, -0.016362018883228302, -0.01549982838332653, -0.014637637883424759, -0.013775447383522987, -0.012913256883621216, -0.012051066383719444, -0.011188875883817673, -0.010326685383915901, -0.00946449488401413, -0.008602304384112358, -0.0077401138842105865, -0.006877923384308815, -0.0060157328844070435, -0.005153542384505272, -0.0042913518846035, -0.003429161384701729, -0.0025669708847999573, -0.0017047803848981857, -0.0008425898849964142, 1.960061490535736e-05, 0.0008817911148071289, 0.0017439816147089005, 0.002606172114610672, 0.0034683626145124435, 0.004330553114414215, 0.005192743614315987, 0.006054934114217758, 0.00691712461411953, 0.007779315114021301, 0.008641505613923073, 0.009503696113824844, 0.010365886613726616, 0.011228077113628387, 0.012090267613530159, 0.01295245811343193, 0.013814648613333702, 0.014676839113235474, 0.015539029613137245, 0.016401220113039017, 0.01726341061294079, 0.01812560111284256, 0.01898779161274433, 0.019849982112646103, 0.020712172612547874, 0.021574363112449646, 0.022436553612351418, 0.02329874411225319, 0.02416093461215496, 0.025023125112056732, 0.025885315611958504, 0.026747506111860275, 0.027609696611762047, 0.02847188711166382]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 7.0, 10.0, 16.0, 28.0, 25.0, 54.0, 70.0, 90.0, 127.0, 170.0, 230.0, 341.0, 472.0, 662.0, 987.0, 1485.0, 2159.0, 3598.0, 6139.0, 11468.0, 27766.0, 595521.0, 345126.0, 25275.0, 10935.0, 5704.0, 3445.0, 2154.0, 1345.0, 932.0, 599.0, 453.0, 336.0, 194.0, 182.0, 120.0, 82.0, 64.0, 40.0, 36.0, 22.0, 20.0, 10.0, 9.0, 10.0, 4.0, 3.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.034210205078125, -0.033139705657958984, -0.03206920623779297, -0.030998706817626953, -0.029928207397460938, -0.028857707977294922, -0.027787208557128906, -0.02671670913696289, -0.025646209716796875, -0.02457571029663086, -0.023505210876464844, -0.022434711456298828, -0.021364212036132812, -0.020293712615966797, -0.01922321319580078, -0.018152713775634766, -0.01708221435546875, -0.016011714935302734, -0.014941215515136719, -0.013870716094970703, -0.012800216674804688, -0.011729717254638672, -0.010659217834472656, -0.00958871841430664, -0.008518218994140625, -0.007447719573974609, -0.006377220153808594, -0.005306720733642578, -0.0042362213134765625, -0.003165721893310547, -0.0020952224731445312, -0.0010247230529785156, 4.57763671875e-05, 0.0011162757873535156, 0.0021867752075195312, 0.003257274627685547, 0.0043277740478515625, 0.005398273468017578, 0.006468772888183594, 0.007539272308349609, 0.008609771728515625, 0.00968027114868164, 0.010750770568847656, 0.011821269989013672, 0.012891769409179688, 0.013962268829345703, 0.015032768249511719, 0.016103267669677734, 0.01717376708984375, 0.018244266510009766, 0.01931476593017578, 0.020385265350341797, 0.021455764770507812, 0.022526264190673828, 0.023596763610839844, 0.02466726303100586, 0.025737762451171875, 0.02680826187133789, 0.027878761291503906, 0.028949260711669922, 0.030019760131835938, 0.031090259552001953, 0.03216075897216797, 0.033231258392333984, 0.0343017578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 2.0, 11.0, 9.0, 15.0, 69.0, 235.0, 351.0, 142.0, 40.0, 19.0, 9.0, 8.0, 7.0, 6.0, 7.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004428863525390625, -0.004282653331756592, -0.004136443138122559, -0.003990232944488525, -0.003844022750854492, -0.003697812557220459, -0.0035516023635864258, -0.0034053921699523926, -0.0032591819763183594, -0.003112971782684326, -0.002966761589050293, -0.0028205513954162598, -0.0026743412017822266, -0.0025281310081481934, -0.00238192081451416, -0.002235710620880127, -0.0020895004272460938, -0.0019432902336120605, -0.0017970800399780273, -0.0016508698463439941, -0.001504659652709961, -0.0013584494590759277, -0.0012122392654418945, -0.0010660290718078613, -0.0009198188781738281, -0.0007736086845397949, -0.0006273984909057617, -0.0004811882972717285, -0.0003349781036376953, -0.0001887679100036621, -4.2557716369628906e-05, 0.0001036524772644043, 0.0002498626708984375, 0.0003960728645324707, 0.0005422830581665039, 0.0006884932518005371, 0.0008347034454345703, 0.0009809136390686035, 0.0011271238327026367, 0.00127333402633667, 0.0014195442199707031, 0.0015657544136047363, 0.0017119646072387695, 0.0018581748008728027, 0.002004384994506836, 0.002150595188140869, 0.0022968053817749023, 0.0024430155754089355, 0.0025892257690429688, 0.002735435962677002, 0.002881646156311035, 0.0030278563499450684, 0.0031740665435791016, 0.0033202767372131348, 0.003466486930847168, 0.003612697124481201, 0.0037589073181152344, 0.0039051175117492676, 0.004051327705383301, 0.004197537899017334, 0.004343748092651367, 0.0044899582862854, 0.004636168479919434, 0.004782378673553467, 0.0049285888671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 11.0, 8.0, 26.0, 30.0, 30.0, 41.0, 71.0, 70.0, 126.0, 197.0, 401.0, 700.0, 1285.0, 3241.0, 10739.0, 166868.0, 831751.0, 24042.0, 4869.0, 1971.0, 823.0, 463.0, 267.0, 140.0, 126.0, 74.0, 50.0, 37.0, 22.0, 11.0, 12.0, 14.0, 8.0, 2.0, 5.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0908203125, -0.0882406234741211, -0.08566093444824219, -0.08308124542236328, -0.08050155639648438, -0.07792186737060547, -0.07534217834472656, -0.07276248931884766, -0.07018280029296875, -0.06760311126708984, -0.06502342224121094, -0.06244373321533203, -0.059864044189453125, -0.05728435516357422, -0.05470466613769531, -0.052124977111816406, -0.0495452880859375, -0.046965599060058594, -0.04438591003417969, -0.04180622100830078, -0.039226531982421875, -0.03664684295654297, -0.03406715393066406, -0.031487464904785156, -0.02890777587890625, -0.026328086853027344, -0.023748397827148438, -0.02116870880126953, -0.018589019775390625, -0.01600933074951172, -0.013429641723632812, -0.010849952697753906, -0.008270263671875, -0.005690574645996094, -0.0031108856201171875, -0.0005311965942382812, 0.002048492431640625, 0.004628181457519531, 0.0072078704833984375, 0.009787559509277344, 0.01236724853515625, 0.014946937561035156, 0.017526626586914062, 0.02010631561279297, 0.022686004638671875, 0.02526569366455078, 0.027845382690429688, 0.030425071716308594, 0.0330047607421875, 0.035584449768066406, 0.03816413879394531, 0.04074382781982422, 0.043323516845703125, 0.04590320587158203, 0.04848289489746094, 0.051062583923339844, 0.05364227294921875, 0.056221961975097656, 0.05880165100097656, 0.06138134002685547, 0.06396102905273438, 0.06654071807861328, 0.06912040710449219, 0.0717000961303711, 0.07427978515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 17.0, 10.0, 15.0, 14.0, 14.0, 15.0, 30.0, 28.0, 29.0, 19.0, 31.0, 38.0, 34.0, 31.0, 43.0, 53.0, 38.0, 35.0, 43.0, 38.0, 41.0, 34.0, 31.0, 23.0, 30.0, 24.0, 29.0, 26.0, 22.0, 17.0, 31.0, 16.0, 24.0, 6.0, 9.0, 10.0, 8.0, 6.0, 7.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.016912221908569336, -0.016307353973388672, -0.015702486038208008, -0.015097618103027344, -0.01449275016784668, -0.013887882232666016, -0.013283014297485352, -0.012678146362304688, -0.012073278427124023, -0.01146841049194336, -0.010863542556762695, -0.010258674621582031, -0.009653806686401367, -0.009048938751220703, -0.008444070816040039, -0.007839202880859375, -0.007234334945678711, -0.006629467010498047, -0.006024599075317383, -0.005419731140136719, -0.004814863204956055, -0.004209995269775391, -0.0036051273345947266, -0.0030002593994140625, -0.0023953914642333984, -0.0017905235290527344, -0.0011856555938720703, -0.0005807876586914062, 2.4080276489257812e-05, 0.0006289482116699219, 0.001233816146850586, 0.00183868408203125, 0.002443552017211914, 0.003048419952392578, 0.003653287887573242, 0.004258155822753906, 0.00486302375793457, 0.005467891693115234, 0.0060727596282958984, 0.0066776275634765625, 0.0072824954986572266, 0.00788736343383789, 0.008492231369018555, 0.009097099304199219, 0.009701967239379883, 0.010306835174560547, 0.010911703109741211, 0.011516571044921875, 0.012121438980102539, 0.012726306915283203, 0.013331174850463867, 0.013936042785644531, 0.014540910720825195, 0.01514577865600586, 0.015750646591186523, 0.016355514526367188, 0.01696038246154785, 0.017565250396728516, 0.01817011833190918, 0.018774986267089844, 0.019379854202270508, 0.019984722137451172, 0.020589590072631836, 0.0211944580078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 5.0, 13.0, 18.0, 26.0, 24.0, 65.0, 120.0, 251.0, 668.0, 2246.0, 17242.0, 988102.0, 35251.0, 3105.0, 792.0, 289.0, 141.0, 87.0, 36.0, 26.0, 16.0, 18.0, 5.0, 2.0, 1.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07763671875, -0.07557201385498047, -0.07350730895996094, -0.0714426040649414, -0.06937789916992188, -0.06731319427490234, -0.06524848937988281, -0.06318378448486328, -0.06111907958984375, -0.05905437469482422, -0.05698966979980469, -0.054924964904785156, -0.052860260009765625, -0.050795555114746094, -0.04873085021972656, -0.04666614532470703, -0.0446014404296875, -0.04253673553466797, -0.04047203063964844, -0.038407325744628906, -0.036342620849609375, -0.034277915954589844, -0.03221321105957031, -0.03014850616455078, -0.02808380126953125, -0.02601909637451172, -0.023954391479492188, -0.021889686584472656, -0.019824981689453125, -0.017760276794433594, -0.015695571899414062, -0.013630867004394531, -0.011566162109375, -0.009501457214355469, -0.0074367523193359375, -0.005372047424316406, -0.003307342529296875, -0.0012426376342773438, 0.0008220672607421875, 0.0028867721557617188, 0.00495147705078125, 0.007016181945800781, 0.009080886840820312, 0.011145591735839844, 0.013210296630859375, 0.015275001525878906, 0.017339706420898438, 0.01940441131591797, 0.0214691162109375, 0.02353382110595703, 0.025598526000976562, 0.027663230895996094, 0.029727935791015625, 0.031792640686035156, 0.03385734558105469, 0.03592205047607422, 0.03798675537109375, 0.04005146026611328, 0.04211616516113281, 0.044180870056152344, 0.046245574951171875, 0.048310279846191406, 0.05037498474121094, 0.05243968963623047, 0.05450439453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 9.0, 9.0, 8.0, 9.0, 26.0, 31.0, 29.0, 29.0, 49.0, 64.0, 85.0, 91.0, 114.0, 88.0, 91.0, 41.0, 46.0, 37.0, 26.0, 20.0, 12.0, 6.0, 8.0, 6.0, 8.0, 10.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002155303955078125, -0.0020920783281326294, -0.002028852701187134, -0.001965627074241638, -0.0019024014472961426, -0.001839175820350647, -0.0017759501934051514, -0.0017127245664596558, -0.0016494989395141602, -0.0015862733125686646, -0.001523047685623169, -0.0014598220586776733, -0.0013965964317321777, -0.0013333708047866821, -0.0012701451778411865, -0.001206919550895691, -0.0011436939239501953, -0.0010804682970046997, -0.001017242670059204, -0.0009540170431137085, -0.0008907914161682129, -0.0008275657892227173, -0.0007643401622772217, -0.0007011145353317261, -0.0006378889083862305, -0.0005746632814407349, -0.0005114376544952393, -0.00044821202754974365, -0.00038498640060424805, -0.00032176077365875244, -0.00025853514671325684, -0.00019530951976776123, -0.00013208389282226562, -6.885826587677002e-05, -5.632638931274414e-06, 5.759298801422119e-05, 0.0001208186149597168, 0.0001840442419052124, 0.000247269868850708, 0.0003104954957962036, 0.0003737211227416992, 0.0004369467496871948, 0.0005001723766326904, 0.000563398003578186, 0.0006266236305236816, 0.0006898492574691772, 0.0007530748844146729, 0.0008163005113601685, 0.0008795261383056641, 0.0009427517652511597, 0.0010059773921966553, 0.0010692030191421509, 0.0011324286460876465, 0.001195654273033142, 0.0012588798999786377, 0.0013221055269241333, 0.001385331153869629, 0.0014485567808151245, 0.0015117824077606201, 0.0015750080347061157, 0.0016382336616516113, 0.001701459288597107, 0.0017646849155426025, 0.0018279105424880981, 0.0018911361694335938]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 17.0, 16.0, 27.0, 41.0, 69.0, 176.0, 433.0, 1504.0, 6324.0, 51823.0, 892137.0, 84994.0, 8130.0, 1862.0, 574.0, 225.0, 98.0, 48.0, 26.0, 11.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030103683471679688, -0.028926849365234375, -0.027750015258789062, -0.02657318115234375, -0.025396347045898438, -0.024219512939453125, -0.023042678833007812, -0.0218658447265625, -0.020689010620117188, -0.019512176513671875, -0.018335342407226562, -0.01715850830078125, -0.015981674194335938, -0.014804840087890625, -0.013628005981445312, -0.012451171875, -0.011274337768554688, -0.010097503662109375, -0.008920669555664062, -0.00774383544921875, -0.0065670013427734375, -0.005390167236328125, -0.0042133331298828125, -0.0030364990234375, -0.0018596649169921875, -0.000682830810546875, 0.0004940032958984375, 0.00167083740234375, 0.0028476715087890625, 0.004024505615234375, 0.0052013397216796875, 0.006378173828125, 0.0075550079345703125, 0.008731842041015625, 0.009908676147460938, 0.01108551025390625, 0.012262344360351562, 0.013439178466796875, 0.014616012573242188, 0.0157928466796875, 0.016969680786132812, 0.018146514892578125, 0.019323348999023438, 0.02050018310546875, 0.021677017211914062, 0.022853851318359375, 0.024030685424804688, 0.02520751953125, 0.026384353637695312, 0.027561187744140625, 0.028738021850585938, 0.02991485595703125, 0.031091690063476562, 0.032268524169921875, 0.03344535827636719, 0.0346221923828125, 0.03579902648925781, 0.036975860595703125, 0.03815269470214844, 0.03932952880859375, 0.04050636291503906, 0.041683197021484375, 0.04286003112792969, 0.044036865234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 15.0, 11.0, 14.0, 15.0, 30.0, 56.0, 55.0, 66.0, 80.0, 110.0, 104.0, 84.0, 67.0, 65.0, 46.0, 37.0, 28.0, 21.0, 15.0, 14.0, 6.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01605224609375, -0.01554250717163086, -0.015032768249511719, -0.014523029327392578, -0.014013290405273438, -0.013503551483154297, -0.012993812561035156, -0.012484073638916016, -0.011974334716796875, -0.011464595794677734, -0.010954856872558594, -0.010445117950439453, -0.009935379028320312, -0.009425640106201172, -0.008915901184082031, -0.00840616226196289, -0.00789642333984375, -0.007386684417724609, -0.006876945495605469, -0.006367206573486328, -0.0058574676513671875, -0.005347728729248047, -0.004837989807128906, -0.004328250885009766, -0.003818511962890625, -0.0033087730407714844, -0.0027990341186523438, -0.002289295196533203, -0.0017795562744140625, -0.0012698173522949219, -0.0007600784301757812, -0.0002503395080566406, 0.0002593994140625, 0.0007691383361816406, 0.0012788772583007812, 0.0017886161804199219, 0.0022983551025390625, 0.002808094024658203, 0.0033178329467773438, 0.0038275718688964844, 0.004337310791015625, 0.004847049713134766, 0.005356788635253906, 0.005866527557373047, 0.0063762664794921875, 0.006886005401611328, 0.007395744323730469, 0.00790548324584961, 0.00841522216796875, 0.00892496109008789, 0.009434700012207031, 0.009944438934326172, 0.010454177856445312, 0.010963916778564453, 0.011473655700683594, 0.011983394622802734, 0.012493133544921875, 0.013002872467041016, 0.013512611389160156, 0.014022350311279297, 0.014532089233398438, 0.015041828155517578, 0.015551567077636719, 0.01606130599975586, 0.016571044921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 28.0, 229.0, 631.0, 59.0, 17.0, 14.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8714686632156372, -0.8435510993003845, -0.8156334757804871, -0.7877159118652344, -0.7597983479499817, -0.731880784034729, -0.7039631605148315, -0.6760455965995789, -0.6481280326843262, -0.6202104687690735, -0.592292845249176, -0.5643752813339233, -0.5364577174186707, -0.508540153503418, -0.4806225299835205, -0.4527049660682678, -0.42478734254837036, -0.3968697488307953, -0.3689521849155426, -0.34103459119796753, -0.31311702728271484, -0.28519943356513977, -0.2572818398475647, -0.22936426103115082, -0.20144668221473694, -0.17352910339832306, -0.14561152458190918, -0.1176939308643341, -0.08977635204792023, -0.06185877323150635, -0.033941179513931274, -0.006023600697517395, 0.02189391851425171, 0.04981150105595589, 0.07772908359766006, 0.10564666986465454, 0.13356424868106842, 0.1614818274974823, 0.18939942121505737, 0.21731700003147125, 0.24523457884788513, 0.2731521725654602, 0.3010697364807129, 0.32898733019828796, 0.35690492391586304, 0.3848224878311157, 0.4127400815486908, 0.44065767526626587, 0.46857523918151855, 0.49649283289909363, 0.5244104266166687, 0.5523279905319214, 0.5802455544471741, 0.6081631183624268, 0.6360807418823242, 0.6639983057975769, 0.6919158697128296, 0.7198334336280823, 0.7477510571479797, 0.7756686210632324, 0.8035861849784851, 0.8315037488937378, 0.8594213724136353, 0.8873389363288879, 0.9152565598487854]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 1.0, 4.0, 4.0, 4.0, 6.0, 2.0, 5.0, 10.0, 15.0, 22.0, 47.0, 79.0, 114.0, 159.0, 152.0, 138.0, 87.0, 46.0, 35.0, 23.0, 12.0, 5.0, 3.0, 4.0, 4.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4582235813140869, -0.4447319805622101, -0.43124035000801086, -0.41774874925613403, -0.4042571485042572, -0.39076554775238037, -0.37727391719818115, -0.3637823164463043, -0.3502907156944275, -0.33679911494255066, -0.32330748438835144, -0.3098158836364746, -0.2963242828845978, -0.28283268213272095, -0.26934105157852173, -0.2558494508266449, -0.24235783517360687, -0.22886621952056885, -0.21537461876869202, -0.201883003115654, -0.18839140236377716, -0.17489978671073914, -0.1614081859588623, -0.14791657030582428, -0.13442495465278625, -0.12093334645032883, -0.1074417382478714, -0.09395012259483337, -0.08045852184295654, -0.06696690618991852, -0.05347529798746109, -0.03998368978500366, -0.02649208903312683, -0.013000479899346828, 0.0004911292344331741, 0.013982739299535751, 0.02747434750199318, 0.040965959429740906, 0.054457567632198334, 0.06794917583465576, 0.08144078403711319, 0.09493239223957062, 0.10842400044202805, 0.12191560864448547, 0.1354072242975235, 0.14889883995056152, 0.16239044070243835, 0.17588204145431519, 0.1893736571073532, 0.20286527276039124, 0.21635687351226807, 0.2298484891653061, 0.24334008991718292, 0.25683170557022095, 0.2703233063220978, 0.2838149070739746, 0.29730653762817383, 0.31079813838005066, 0.3242897689342499, 0.3377813696861267, 0.35127297043800354, 0.36476457118988037, 0.3782562017440796, 0.3917478024959564, 0.40523940324783325]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 8.0, 11.0, 16.0, 11.0, 24.0, 26.0, 43.0, 108.0, 729.0, 23959.0, 4166997.0, 2032.0, 108.0, 57.0, 37.0, 21.0, 17.0, 15.0, 10.0, 9.0, 5.0, 3.0, 6.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.109375, -2.0543060302734375, -1.999237060546875, -1.9441680908203125, -1.88909912109375, -1.8340301513671875, -1.778961181640625, -1.7238922119140625, -1.6688232421875, -1.6137542724609375, -1.558685302734375, -1.5036163330078125, -1.44854736328125, -1.3934783935546875, -1.338409423828125, -1.2833404541015625, -1.228271484375, -1.1732025146484375, -1.118133544921875, -1.0630645751953125, -1.00799560546875, -0.9529266357421875, -0.897857666015625, -0.8427886962890625, -0.7877197265625, -0.7326507568359375, -0.677581787109375, -0.6225128173828125, -0.56744384765625, -0.5123748779296875, -0.457305908203125, -0.4022369384765625, -0.34716796875, -0.2920989990234375, -0.237030029296875, -0.1819610595703125, -0.12689208984375, -0.0718231201171875, -0.016754150390625, 0.0383148193359375, 0.0933837890625, 0.1484527587890625, 0.203521728515625, 0.2585906982421875, 0.31365966796875, 0.3687286376953125, 0.423797607421875, 0.4788665771484375, 0.533935546875, 0.5890045166015625, 0.644073486328125, 0.6991424560546875, 0.75421142578125, 0.8092803955078125, 0.864349365234375, 0.9194183349609375, 0.9744873046875, 1.0295562744140625, 1.084625244140625, 1.1396942138671875, 1.19476318359375, 1.2498321533203125, 1.304901123046875, 1.3599700927734375, 1.4150390625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 11.0, 5.0, 8.0, 10.0, 13.0, 11.0, 27.0, 34.0, 78.0, 107.0, 158.0, 157.0, 97.0, 85.0, 59.0, 30.0, 11.0, 10.0, 11.0, 7.0, 4.0, 7.0, 9.0, 3.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003025054931640625, -0.0029384493827819824, -0.00285184383392334, -0.0027652382850646973, -0.0026786327362060547, -0.002592027187347412, -0.0025054216384887695, -0.002418816089630127, -0.0023322105407714844, -0.002245604991912842, -0.0021589994430541992, -0.0020723938941955566, -0.001985788345336914, -0.0018991827964782715, -0.001812577247619629, -0.0017259716987609863, -0.0016393661499023438, -0.0015527606010437012, -0.0014661550521850586, -0.001379549503326416, -0.0012929439544677734, -0.0012063384056091309, -0.0011197328567504883, -0.0010331273078918457, -0.0009465217590332031, -0.0008599162101745605, -0.000773310661315918, -0.0006867051124572754, -0.0006000995635986328, -0.0005134940147399902, -0.00042688846588134766, -0.0003402829170227051, -0.0002536773681640625, -0.00016707181930541992, -8.046627044677734e-05, 6.139278411865234e-06, 9.274482727050781e-05, 0.0001793503761291504, 0.00026595592498779297, 0.00035256147384643555, 0.0004391670227050781, 0.0005257725715637207, 0.0006123781204223633, 0.0006989836692810059, 0.0007855892181396484, 0.000872194766998291, 0.0009588003158569336, 0.0010454058647155762, 0.0011320114135742188, 0.0012186169624328613, 0.001305222511291504, 0.0013918280601501465, 0.001478433609008789, 0.0015650391578674316, 0.0016516447067260742, 0.0017382502555847168, 0.0018248558044433594, 0.001911461353302002, 0.0019980669021606445, 0.002084672451019287, 0.0021712779998779297, 0.0022578835487365723, 0.002344489097595215, 0.0024310946464538574, 0.0025177001953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 6.0, 10.0, 7.0, 10.0, 13.0, 25.0, 23.0, 29.0, 39.0, 49.0, 64.0, 76.0, 96.0, 142.0, 220.0, 1362.0, 4033475.0, 157222.0, 643.0, 178.0, 141.0, 100.0, 89.0, 49.0, 56.0, 24.0, 34.0, 24.0, 15.0, 24.0, 6.0, 5.0, 3.0, 11.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.2595024108886719, -0.24947357177734375, -0.23944473266601562, -0.2294158935546875, -0.21938705444335938, -0.20935821533203125, -0.19932937622070312, -0.189300537109375, -0.17927169799804688, -0.16924285888671875, -0.15921401977539062, -0.1491851806640625, -0.13915634155273438, -0.12912750244140625, -0.11909866333007812, -0.10906982421875, -0.09904098510742188, -0.08901214599609375, -0.07898330688476562, -0.0689544677734375, -0.058925628662109375, -0.04889678955078125, -0.038867950439453125, -0.028839111328125, -0.018810272216796875, -0.00878143310546875, 0.001247406005859375, 0.0112762451171875, 0.021305084228515625, 0.03133392333984375, 0.041362762451171875, 0.0513916015625, 0.061420440673828125, 0.07144927978515625, 0.08147811889648438, 0.0915069580078125, 0.10153579711914062, 0.11156463623046875, 0.12159347534179688, 0.131622314453125, 0.14165115356445312, 0.15167999267578125, 0.16170883178710938, 0.1717376708984375, 0.18176651000976562, 0.19179534912109375, 0.20182418823242188, 0.21185302734375, 0.22188186645507812, 0.23191070556640625, 0.24193954467773438, 0.2519683837890625, 0.2619972229003906, 0.27202606201171875, 0.2820549011230469, 0.292083740234375, 0.3021125793457031, 0.31214141845703125, 0.3221702575683594, 0.3321990966796875, 0.3422279357910156, 0.35225677490234375, 0.3622856140136719, 0.372314453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 7.0, 7.0, 12.0, 12.0, 14.0, 15.0, 22.0, 31.0, 57.0, 77.0, 101.0, 131.0, 230.0, 325.0, 547.0, 899.0, 505.0, 287.0, 210.0, 186.0, 110.0, 78.0, 55.0, 34.0, 21.0, 26.0, 19.0, 12.0, 7.0, 7.0, 2.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004611968994140625, -0.0044699907302856445, -0.004328012466430664, -0.004186034202575684, -0.004044055938720703, -0.0039020776748657227, -0.003760099411010742, -0.0036181211471557617, -0.0034761428833007812, -0.0033341646194458008, -0.0031921863555908203, -0.00305020809173584, -0.0029082298278808594, -0.002766251564025879, -0.0026242733001708984, -0.002482295036315918, -0.0023403167724609375, -0.002198338508605957, -0.0020563602447509766, -0.001914381980895996, -0.0017724037170410156, -0.0016304254531860352, -0.0014884471893310547, -0.0013464689254760742, -0.0012044906616210938, -0.0010625123977661133, -0.0009205341339111328, -0.0007785558700561523, -0.0006365776062011719, -0.0004945993423461914, -0.00035262107849121094, -0.00021064281463623047, -6.866455078125e-05, 7.331371307373047e-05, 0.00021529197692871094, 0.0003572702407836914, 0.0004992485046386719, 0.0006412267684936523, 0.0007832050323486328, 0.0009251832962036133, 0.0010671615600585938, 0.0012091398239135742, 0.0013511180877685547, 0.0014930963516235352, 0.0016350746154785156, 0.001777052879333496, 0.0019190311431884766, 0.002061009407043457, 0.0022029876708984375, 0.002344965934753418, 0.0024869441986083984, 0.002628922462463379, 0.0027709007263183594, 0.00291287899017334, 0.0030548572540283203, 0.0031968355178833008, 0.0033388137817382812, 0.0034807920455932617, 0.003622770309448242, 0.0037647485733032227, 0.003906726837158203, 0.004048705101013184, 0.004190683364868164, 0.0043326616287231445, 0.004474639892578125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 8.0, 159.0, 810.0, 39.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04298434779047966, -0.029278934001922607, -0.015573520213365555, -0.0018681064248085022, 0.01183730736374855, 0.0255427248775959, 0.039248134940862656, 0.05295354500412941, 0.06665895879268646, 0.08036437630653381, 0.09406978636980057, 0.10777519643306732, 0.12148061394691467, 0.13518603146076202, 0.14889144897460938, 0.16259685158729553, 0.17630226910114288, 0.19000768661499023, 0.2037130892276764, 0.21741850674152374, 0.2311239242553711, 0.24482934176921844, 0.2585347592830658, 0.27224016189575195, 0.2859455943107605, 0.29965099692344666, 0.3133564293384552, 0.32706183195114136, 0.3407672643661499, 0.35447266697883606, 0.3681780695915222, 0.38188350200653076, 0.39558887481689453, 0.4092942774295807, 0.42299970984458923, 0.4367051124572754, 0.45041054487228394, 0.4641159474849701, 0.47782135009765625, 0.4915267825126648, 0.5052322149276733, 0.5189376473426819, 0.5326430201530457, 0.5463484525680542, 0.5600538849830627, 0.5737593173980713, 0.5874646902084351, 0.6011701226234436, 0.6148754954338074, 0.6285809278488159, 0.6422863006591797, 0.6559917330741882, 0.6696971654891968, 0.6834025382995605, 0.6971079707145691, 0.7108134031295776, 0.7245187759399414, 0.73822420835495, 0.7519295811653137, 0.7656350135803223, 0.7793404459953308, 0.7930458784103394, 0.8067512512207031, 0.8204566836357117, 0.8341621160507202]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 12.0, 10.0, 21.0, 33.0, 58.0, 88.0, 102.0, 122.0, 120.0, 103.0, 106.0, 79.0, 56.0, 38.0, 24.0, 11.0, 9.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02246958017349243, -0.02055458351969719, -0.018639585003256798, -0.016724586486816406, -0.014809589833021164, -0.012894592247903347, -0.01097959466278553, -0.009064597077667713, -0.007149599492549896, -0.005234601907432079, -0.0033196043223142624, -0.0014046067371964455, 0.0005103908479213715, 0.0024253884330391884, 0.004340386018157005, 0.006255383603274822, 0.00817038118839264, 0.010085378773510456, 0.012000376358628273, 0.01391537394374609, 0.015830371528863907, 0.01774536818265915, 0.01966036669909954, 0.021575365215539932, 0.023490361869335175, 0.025405358523130417, 0.02732035703957081, 0.0292353555560112, 0.031150352209806442, 0.033065348863601685, 0.034980349242687225, 0.03689534589648247, 0.03881034255027771, 0.04072533920407295, 0.042640335857868195, 0.044555336236953735, 0.04647033289074898, 0.04838532954454422, 0.05030032992362976, 0.052215326577425, 0.054130323231220245, 0.05604531988501549, 0.05796031653881073, 0.05987531691789627, 0.06179031357169151, 0.06370531022548676, 0.0656203106045723, 0.06753530353307724, 0.06945030391216278, 0.07136530429124832, 0.07328029721975327, 0.0751952975988388, 0.07711029052734375, 0.07902529090642929, 0.08094029128551483, 0.08285528421401978, 0.08477028459310532, 0.08668528497219086, 0.0886002779006958, 0.09051527827978134, 0.09243027865886688, 0.09434527158737183, 0.09626027196645737, 0.09817526489496231, 0.10009026527404785]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 4.0, 8.0, 12.0, 15.0, 23.0, 18.0, 39.0, 25.0, 39.0, 78.0, 225.0, 923.0, 5108.0, 47532.0, 956079.0, 33027.0, 4113.0, 798.0, 206.0, 80.0, 47.0, 30.0, 26.0, 15.0, 9.0, 19.0, 9.0, 10.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.08104801177978516, -0.07829475402832031, -0.07554149627685547, -0.07278823852539062, -0.07003498077392578, -0.06728172302246094, -0.0645284652709961, -0.06177520751953125, -0.059021949768066406, -0.05626869201660156, -0.05351543426513672, -0.050762176513671875, -0.04800891876220703, -0.04525566101074219, -0.042502403259277344, -0.0397491455078125, -0.036995887756347656, -0.03424263000488281, -0.03148937225341797, -0.028736114501953125, -0.02598285675048828, -0.023229598999023438, -0.020476341247558594, -0.01772308349609375, -0.014969825744628906, -0.012216567993164062, -0.009463310241699219, -0.006710052490234375, -0.003956794738769531, -0.0012035369873046875, 0.0015497207641601562, 0.004302978515625, 0.007056236267089844, 0.009809494018554688, 0.012562751770019531, 0.015316009521484375, 0.01806926727294922, 0.020822525024414062, 0.023575782775878906, 0.02632904052734375, 0.029082298278808594, 0.03183555603027344, 0.03458881378173828, 0.037342071533203125, 0.04009532928466797, 0.04284858703613281, 0.045601844787597656, 0.0483551025390625, 0.051108360290527344, 0.05386161804199219, 0.05661487579345703, 0.059368133544921875, 0.06212139129638672, 0.06487464904785156, 0.0676279067993164, 0.07038116455078125, 0.0731344223022461, 0.07588768005371094, 0.07864093780517578, 0.08139419555664062, 0.08414745330810547, 0.08690071105957031, 0.08965396881103516, 0.0924072265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 4.0, 0.0, 8.0, 9.0, 17.0, 28.0, 84.0, 253.0, 328.0, 162.0, 46.0, 24.0, 13.0, 18.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00287628173828125, -0.0026438236236572266, -0.002411365509033203, -0.0021789073944091797, -0.0019464492797851562, -0.0017139911651611328, -0.0014815330505371094, -0.001249074935913086, -0.0010166168212890625, -0.0007841587066650391, -0.0005517005920410156, -0.0003192424774169922, -8.678436279296875e-05, 0.0001456737518310547, 0.0003781318664550781, 0.0006105899810791016, 0.000843048095703125, 0.0010755062103271484, 0.0013079643249511719, 0.0015404224395751953, 0.0017728805541992188, 0.002005338668823242, 0.0022377967834472656, 0.002470254898071289, 0.0027027130126953125, 0.002935171127319336, 0.0031676292419433594, 0.003400087356567383, 0.0036325454711914062, 0.0038650035858154297, 0.004097461700439453, 0.0043299198150634766, 0.0045623779296875, 0.0047948360443115234, 0.005027294158935547, 0.00525975227355957, 0.005492210388183594, 0.005724668502807617, 0.005957126617431641, 0.006189584732055664, 0.0064220428466796875, 0.006654500961303711, 0.006886959075927734, 0.007119417190551758, 0.007351875305175781, 0.007584333419799805, 0.007816791534423828, 0.008049249649047852, 0.008281707763671875, 0.008514165878295898, 0.008746623992919922, 0.008979082107543945, 0.009211540222167969, 0.009443998336791992, 0.009676456451416016, 0.009908914566040039, 0.010141372680664062, 0.010373830795288086, 0.01060628890991211, 0.010838747024536133, 0.011071205139160156, 0.01130366325378418, 0.011536121368408203, 0.011768579483032227, 0.01200103759765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 10.0, 11.0, 16.0, 15.0, 20.0, 27.0, 31.0, 25.0, 55.0, 84.0, 384.0, 3499.0, 357317.0, 680882.0, 5350.0, 477.0, 123.0, 42.0, 23.0, 27.0, 35.0, 12.0, 17.0, 15.0, 3.0, 13.0, 8.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0821533203125, -0.07922554016113281, -0.07629776000976562, -0.07336997985839844, -0.07044219970703125, -0.06751441955566406, -0.06458663940429688, -0.06165885925292969, -0.0587310791015625, -0.05580329895019531, -0.052875518798828125, -0.04994773864746094, -0.04701995849609375, -0.04409217834472656, -0.041164398193359375, -0.03823661804199219, -0.035308837890625, -0.03238105773925781, -0.029453277587890625, -0.026525497436523438, -0.02359771728515625, -0.020669937133789062, -0.017742156982421875, -0.014814376831054688, -0.0118865966796875, -0.008958816528320312, -0.006031036376953125, -0.0031032562255859375, -0.00017547607421875, 0.0027523040771484375, 0.005680084228515625, 0.008607864379882812, 0.01153564453125, 0.014463424682617188, 0.017391204833984375, 0.020318984985351562, 0.02324676513671875, 0.026174545288085938, 0.029102325439453125, 0.03203010559082031, 0.0349578857421875, 0.03788566589355469, 0.040813446044921875, 0.04374122619628906, 0.04666900634765625, 0.04959678649902344, 0.052524566650390625, 0.05545234680175781, 0.058380126953125, 0.06130790710449219, 0.06423568725585938, 0.06716346740722656, 0.07009124755859375, 0.07301902770996094, 0.07594680786132812, 0.07887458801269531, 0.0818023681640625, 0.08473014831542969, 0.08765792846679688, 0.09058570861816406, 0.09351348876953125, 0.09644126892089844, 0.09936904907226562, 0.10229682922363281, 0.105224609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 11.0, 11.0, 14.0, 16.0, 22.0, 20.0, 22.0, 27.0, 19.0, 37.0, 36.0, 36.0, 46.0, 42.0, 40.0, 51.0, 64.0, 44.0, 42.0, 44.0, 34.0, 27.0, 26.0, 27.0, 29.0, 19.0, 28.0, 32.0, 21.0, 18.0, 10.0, 15.0, 9.0, 12.0, 4.0, 6.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01145172119140625, -0.01109921932220459, -0.01074671745300293, -0.01039421558380127, -0.01004171371459961, -0.00968921184539795, -0.009336709976196289, -0.008984208106994629, -0.008631706237792969, -0.008279204368591309, -0.007926702499389648, -0.007574200630187988, -0.007221698760986328, -0.006869196891784668, -0.006516695022583008, -0.006164193153381348, -0.0058116912841796875, -0.005459189414978027, -0.005106687545776367, -0.004754185676574707, -0.004401683807373047, -0.004049181938171387, -0.0036966800689697266, -0.0033441781997680664, -0.0029916763305664062, -0.002639174461364746, -0.002286672592163086, -0.0019341707229614258, -0.0015816688537597656, -0.0012291669845581055, -0.0008766651153564453, -0.0005241632461547852, -0.000171661376953125, 0.00018084049224853516, 0.0005333423614501953, 0.0008858442306518555, 0.0012383460998535156, 0.0015908479690551758, 0.001943349838256836, 0.002295851707458496, 0.0026483535766601562, 0.0030008554458618164, 0.0033533573150634766, 0.0037058591842651367, 0.004058361053466797, 0.004410862922668457, 0.004763364791870117, 0.005115866661071777, 0.0054683685302734375, 0.005820870399475098, 0.006173372268676758, 0.006525874137878418, 0.006878376007080078, 0.007230877876281738, 0.0075833797454833984, 0.007935881614685059, 0.008288383483886719, 0.008640885353088379, 0.008993387222290039, 0.0093458890914917, 0.00969839096069336, 0.01005089282989502, 0.01040339469909668, 0.01075589656829834, 0.0111083984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 14.0, 36.0, 89.0, 381.0, 8923.0, 1037235.0, 1554.0, 183.0, 57.0, 22.0, 11.0, 8.0, 5.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2335205078125, -0.2258167266845703, -0.21811294555664062, -0.21040916442871094, -0.20270538330078125, -0.19500160217285156, -0.18729782104492188, -0.1795940399169922, -0.1718902587890625, -0.1641864776611328, -0.15648269653320312, -0.14877891540527344, -0.14107513427734375, -0.13337135314941406, -0.12566757202148438, -0.11796379089355469, -0.110260009765625, -0.10255622863769531, -0.09485244750976562, -0.08714866638183594, -0.07944488525390625, -0.07174110412597656, -0.06403732299804688, -0.05633354187011719, -0.0486297607421875, -0.04092597961425781, -0.033222198486328125, -0.025518417358398438, -0.01781463623046875, -0.010110855102539062, -0.002407073974609375, 0.0052967071533203125, 0.01300048828125, 0.020704269409179688, 0.028408050537109375, 0.03611183166503906, 0.04381561279296875, 0.05151939392089844, 0.059223175048828125, 0.06692695617675781, 0.0746307373046875, 0.08233451843261719, 0.09003829956054688, 0.09774208068847656, 0.10544586181640625, 0.11314964294433594, 0.12085342407226562, 0.1285572052001953, 0.136260986328125, 0.1439647674560547, 0.15166854858398438, 0.15937232971191406, 0.16707611083984375, 0.17477989196777344, 0.18248367309570312, 0.1901874542236328, 0.1978912353515625, 0.2055950164794922, 0.21329879760742188, 0.22100257873535156, 0.22870635986328125, 0.23641014099121094, 0.24411392211914062, 0.2518177032470703, 0.259521484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 6.0, 16.0, 20.0, 41.0, 74.0, 361.0, 295.0, 58.0, 33.0, 14.0, 14.0, 12.0, 12.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0029010772705078125, -0.0028318464756011963, -0.00276261568069458, -0.002693384885787964, -0.0026241540908813477, -0.0025549232959747314, -0.0024856925010681152, -0.002416461706161499, -0.002347230911254883, -0.0022780001163482666, -0.0022087693214416504, -0.002139538526535034, -0.002070307731628418, -0.0020010769367218018, -0.0019318461418151855, -0.0018626153469085693, -0.0017933845520019531, -0.001724153757095337, -0.0016549229621887207, -0.0015856921672821045, -0.0015164613723754883, -0.001447230577468872, -0.0013779997825622559, -0.0013087689876556396, -0.0012395381927490234, -0.0011703073978424072, -0.001101076602935791, -0.0010318458080291748, -0.0009626150131225586, -0.0008933842182159424, -0.0008241534233093262, -0.00075492262840271, -0.0006856918334960938, -0.0006164610385894775, -0.0005472302436828613, -0.0004779994487762451, -0.0004087686538696289, -0.0003395378589630127, -0.0002703070640563965, -0.00020107626914978027, -0.00013184547424316406, -6.261467933654785e-05, 6.616115570068359e-06, 7.584691047668457e-05, 0.00014507770538330078, 0.000214308500289917, 0.0002835392951965332, 0.0003527700901031494, 0.0004220008850097656, 0.0004912316799163818, 0.000560462474822998, 0.0006296932697296143, 0.0006989240646362305, 0.0007681548595428467, 0.0008373856544494629, 0.0009066164493560791, 0.0009758472442626953, 0.0010450780391693115, 0.0011143088340759277, 0.001183539628982544, 0.0012527704238891602, 0.0013220012187957764, 0.0013912320137023926, 0.0014604628086090088, 0.001529693603515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 12.0, 11.0, 19.0, 30.0, 34.0, 55.0, 85.0, 173.0, 319.0, 714.0, 2163.0, 9456.0, 95604.0, 884027.0, 46422.0, 6376.0, 1694.0, 645.0, 259.0, 178.0, 90.0, 72.0, 30.0, 28.0, 16.0, 14.0, 3.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062225341796875, -0.06041574478149414, -0.05860614776611328, -0.05679655075073242, -0.05498695373535156, -0.0531773567199707, -0.051367759704589844, -0.049558162689208984, -0.047748565673828125, -0.045938968658447266, -0.044129371643066406, -0.04231977462768555, -0.04051017761230469, -0.03870058059692383, -0.03689098358154297, -0.03508138656616211, -0.03327178955078125, -0.03146219253540039, -0.02965259552001953, -0.027842998504638672, -0.026033401489257812, -0.024223804473876953, -0.022414207458496094, -0.020604610443115234, -0.018795013427734375, -0.016985416412353516, -0.015175819396972656, -0.013366222381591797, -0.011556625366210938, -0.009747028350830078, -0.007937431335449219, -0.006127834320068359, -0.0043182373046875, -0.0025086402893066406, -0.0006990432739257812, 0.0011105537414550781, 0.0029201507568359375, 0.004729747772216797, 0.006539344787597656, 0.008348941802978516, 0.010158538818359375, 0.011968135833740234, 0.013777732849121094, 0.015587329864501953, 0.017396926879882812, 0.019206523895263672, 0.02101612091064453, 0.02282571792602539, 0.02463531494140625, 0.02644491195678711, 0.02825450897216797, 0.030064105987548828, 0.03187370300292969, 0.03368330001831055, 0.035492897033691406, 0.037302494049072266, 0.039112091064453125, 0.040921688079833984, 0.042731285095214844, 0.0445408821105957, 0.04635047912597656, 0.04816007614135742, 0.04996967315673828, 0.05177927017211914, 0.0535888671875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 4.0, 5.0, 6.0, 13.0, 15.0, 21.0, 21.0, 41.0, 69.0, 95.0, 136.0, 153.0, 139.0, 93.0, 61.0, 38.0, 18.0, 15.0, 14.0, 13.0, 7.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01352691650390625, -0.012825369834899902, -0.012123823165893555, -0.011422276496887207, -0.01072072982788086, -0.010019183158874512, -0.009317636489868164, -0.008616089820861816, -0.007914543151855469, -0.007212996482849121, -0.0065114498138427734, -0.005809903144836426, -0.005108356475830078, -0.0044068098068237305, -0.003705263137817383, -0.003003716468811035, -0.0023021697998046875, -0.0016006231307983398, -0.0008990764617919922, -0.00019752979278564453, 0.0005040168762207031, 0.0012055635452270508, 0.0019071102142333984, 0.002608656883239746, 0.0033102035522460938, 0.004011750221252441, 0.004713296890258789, 0.005414843559265137, 0.006116390228271484, 0.006817936897277832, 0.00751948356628418, 0.008221030235290527, 0.008922576904296875, 0.009624123573303223, 0.01032567024230957, 0.011027216911315918, 0.011728763580322266, 0.012430310249328613, 0.013131856918334961, 0.013833403587341309, 0.014534950256347656, 0.015236496925354004, 0.01593804359436035, 0.0166395902633667, 0.017341136932373047, 0.018042683601379395, 0.018744230270385742, 0.01944577693939209, 0.020147323608398438, 0.020848870277404785, 0.021550416946411133, 0.02225196361541748, 0.022953510284423828, 0.023655056953430176, 0.024356603622436523, 0.02505815029144287, 0.02575969696044922, 0.026461243629455566, 0.027162790298461914, 0.02786433696746826, 0.02856588363647461, 0.029267430305480957, 0.029968976974487305, 0.030670523643493652, 0.0313720703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 10.0, 16.0, 43.0, 88.0, 184.0, 261.0, 211.0, 98.0, 31.0, 19.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19143696129322052, -0.1858953833580017, -0.1803537905216217, -0.1748121976852417, -0.1692706197500229, -0.16372904181480408, -0.15818744897842407, -0.15264585614204407, -0.14710427820682526, -0.14156270027160645, -0.13602110743522644, -0.13047951459884644, -0.12493793666362762, -0.11939635127782822, -0.11385476589202881, -0.1083131805062294, -0.10277159512042999, -0.09723000973463058, -0.09168842434883118, -0.08614683896303177, -0.08060525357723236, -0.07506366819143295, -0.06952208280563354, -0.06398049741983414, -0.05843891203403473, -0.05289732664823532, -0.04735574126243591, -0.041814155876636505, -0.0362725704908371, -0.03073098510503769, -0.02518939971923828, -0.019647814333438873, -0.01410624384880066, -0.008564658463001251, -0.0030230730772018433, 0.0025185123085975647, 0.008060097694396973, 0.01360168308019638, 0.01914326846599579, 0.024684853851795197, 0.030226439237594604, 0.03576802462339401, 0.04130961000919342, 0.04685119539499283, 0.052392780780792236, 0.057934366166591644, 0.06347595155239105, 0.06901753693819046, 0.07455912232398987, 0.08010070770978928, 0.08564229309558868, 0.09118387848138809, 0.0967254638671875, 0.10226704925298691, 0.10780863463878632, 0.11335022002458572, 0.11889180541038513, 0.12443339079618454, 0.12997497618198395, 0.13551655411720276, 0.14105814695358276, 0.14659973978996277, 0.15214131772518158, 0.1576828956604004, 0.1632244884967804]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 4.0, 16.0, 19.0, 26.0, 34.0, 55.0, 100.0, 86.0, 130.0, 131.0, 93.0, 87.0, 70.0, 36.0, 38.0, 24.0, 16.0, 7.0, 6.0, 7.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22065919637680054, -0.2150178849697113, -0.20937658846378326, -0.20373529195785522, -0.198093980550766, -0.19245266914367676, -0.18681137263774872, -0.18117007613182068, -0.17552876472473145, -0.1698874533176422, -0.16424615681171417, -0.15860486030578613, -0.1529635488986969, -0.14732223749160767, -0.14168094098567963, -0.1360396444797516, -0.13039833307266235, -0.12475702911615372, -0.11911572515964508, -0.11347442120313644, -0.10783311724662781, -0.10219181329011917, -0.09655050933361053, -0.0909092053771019, -0.08526790142059326, -0.07962659746408463, -0.07398529350757599, -0.06834398955106735, -0.06270268559455872, -0.05706138163805008, -0.05142007768154144, -0.045778773725032806, -0.04013746976852417, -0.03449616581201553, -0.028854861855506897, -0.02321355789899826, -0.017572253942489624, -0.011930949985980988, -0.006289646029472351, -0.0006483420729637146, 0.004992961883544922, 0.010634265840053558, 0.016275569796562195, 0.02191687375307083, 0.027558177709579468, 0.033199481666088104, 0.03884078562259674, 0.04448208957910538, 0.050123393535614014, 0.05576469749212265, 0.06140600144863129, 0.06704730540513992, 0.07268860936164856, 0.0783299133181572, 0.08397121727466583, 0.08961252123117447, 0.0952538251876831, 0.10089512914419174, 0.10653643310070038, 0.11217773705720901, 0.11781904101371765, 0.12346034497022629, 0.12910164892673492, 0.13474294543266296, 0.1403842568397522]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 0.0, 2.0, 6.0, 0.0, 4.0, 6.0, 6.0, 8.0, 10.0, 6.0, 4.0, 8.0, 6.0, 14.0, 8.0, 16.0, 6.0, 16.0, 23.0, 43.0, 212.0, 26896.0, 4166108.0, 612.0, 70.0, 35.0, 17.0, 26.0, 20.0, 18.0, 11.0, 13.0, 10.0, 8.0, 8.0, 10.0, 6.0, 2.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.67822265625, -0.6604537963867188, -0.6426849365234375, -0.6249160766601562, -0.607147216796875, -0.5893783569335938, -0.5716094970703125, -0.5538406372070312, -0.53607177734375, -0.5183029174804688, -0.5005340576171875, -0.48276519775390625, -0.464996337890625, -0.44722747802734375, -0.4294586181640625, -0.41168975830078125, -0.3939208984375, -0.37615203857421875, -0.3583831787109375, -0.34061431884765625, -0.322845458984375, -0.30507659912109375, -0.2873077392578125, -0.26953887939453125, -0.25177001953125, -0.23400115966796875, -0.2162322998046875, -0.19846343994140625, -0.180694580078125, -0.16292572021484375, -0.1451568603515625, -0.12738800048828125, -0.109619140625, -0.09185028076171875, -0.0740814208984375, -0.05631256103515625, -0.038543701171875, -0.02077484130859375, -0.0030059814453125, 0.01476287841796875, 0.03253173828125, 0.05030059814453125, 0.0680694580078125, 0.08583831787109375, 0.103607177734375, 0.12137603759765625, 0.1391448974609375, 0.15691375732421875, 0.1746826171875, 0.19245147705078125, 0.2102203369140625, 0.22798919677734375, 0.245758056640625, 0.26352691650390625, 0.2812957763671875, 0.29906463623046875, 0.31683349609375, 0.33460235595703125, 0.3523712158203125, 0.37014007568359375, 0.387908935546875, 0.40567779541015625, 0.4234466552734375, 0.44121551513671875, 0.458984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 11.0, 8.0, 10.0, 17.0, 25.0, 57.0, 91.0, 115.0, 142.0, 145.0, 107.0, 77.0, 61.0, 30.0, 26.0, 17.0, 18.0, 15.0, 3.0, 7.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003326416015625, -0.003219783306121826, -0.0031131505966186523, -0.0030065178871154785, -0.0028998851776123047, -0.002793252468109131, -0.002686619758605957, -0.002579987049102783, -0.0024733543395996094, -0.0023667216300964355, -0.0022600889205932617, -0.002153456211090088, -0.002046823501586914, -0.0019401907920837402, -0.0018335580825805664, -0.0017269253730773926, -0.0016202926635742188, -0.001513659954071045, -0.001407027244567871, -0.0013003945350646973, -0.0011937618255615234, -0.0010871291160583496, -0.0009804964065551758, -0.000873863697052002, -0.0007672309875488281, -0.0006605982780456543, -0.0005539655685424805, -0.00044733285903930664, -0.0003407001495361328, -0.00023406744003295898, -0.00012743473052978516, -2.0802021026611328e-05, 8.58306884765625e-05, 0.00019246339797973633, 0.00029909610748291016, 0.000405728816986084, 0.0005123615264892578, 0.0006189942359924316, 0.0007256269454956055, 0.0008322596549987793, 0.0009388923645019531, 0.001045525074005127, 0.0011521577835083008, 0.0012587904930114746, 0.0013654232025146484, 0.0014720559120178223, 0.001578688621520996, 0.00168532133102417, 0.0017919540405273438, 0.0018985867500305176, 0.0020052194595336914, 0.0021118521690368652, 0.002218484878540039, 0.002325117588043213, 0.0024317502975463867, 0.0025383830070495605, 0.0026450157165527344, 0.002751648426055908, 0.002858281135559082, 0.002964913845062256, 0.0030715465545654297, 0.0031781792640686035, 0.0032848119735717773, 0.003391444683074951, 0.003498077392578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 18.0, 9.0, 28.0, 35.0, 61.0, 80.0, 121.0, 188.0, 223.0, 570.0, 3211691.0, 979834.0, 574.0, 215.0, 147.0, 143.0, 118.0, 64.0, 52.0, 45.0, 12.0, 17.0, 7.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.208740234375, -0.19879150390625, -0.1888427734375, -0.17889404296875, -0.1689453125, -0.15899658203125, -0.1490478515625, -0.13909912109375, -0.129150390625, -0.11920166015625, -0.1092529296875, -0.09930419921875, -0.08935546875, -0.07940673828125, -0.0694580078125, -0.05950927734375, -0.049560546875, -0.03961181640625, -0.0296630859375, -0.01971435546875, -0.009765625, 0.00018310546875, 0.0101318359375, 0.02008056640625, 0.030029296875, 0.03997802734375, 0.0499267578125, 0.05987548828125, 0.06982421875, 0.07977294921875, 0.0897216796875, 0.09967041015625, 0.109619140625, 0.11956787109375, 0.1295166015625, 0.13946533203125, 0.1494140625, 0.15936279296875, 0.1693115234375, 0.17926025390625, 0.189208984375, 0.19915771484375, 0.2091064453125, 0.21905517578125, 0.22900390625, 0.23895263671875, 0.2489013671875, 0.25885009765625, 0.268798828125, 0.27874755859375, 0.2886962890625, 0.29864501953125, 0.30859375, 0.31854248046875, 0.3284912109375, 0.33843994140625, 0.348388671875, 0.35833740234375, 0.3682861328125, 0.37823486328125, 0.38818359375, 0.39813232421875, 0.4080810546875, 0.41802978515625, 0.427978515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 33.0, 125.0, 2498.0, 1295.0, 88.0, 32.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005390167236328125, -0.0044800639152526855, -0.003569960594177246, -0.0026598572731018066, -0.0017497539520263672, -0.0008396506309509277, 7.045269012451172e-05, 0.0009805560111999512, 0.0018906593322753906, 0.00280076265335083, 0.0037108659744262695, 0.004620969295501709, 0.0055310726165771484, 0.006441175937652588, 0.007351279258728027, 0.008261382579803467, 0.009171485900878906, 0.010081589221954346, 0.010991692543029785, 0.011901795864105225, 0.012811899185180664, 0.013722002506256104, 0.014632105827331543, 0.015542209148406982, 0.016452312469482422, 0.01736241579055786, 0.0182725191116333, 0.01918262243270874, 0.02009272575378418, 0.02100282907485962, 0.02191293239593506, 0.022823035717010498, 0.023733139038085938, 0.024643242359161377, 0.025553345680236816, 0.026463449001312256, 0.027373552322387695, 0.028283655643463135, 0.029193758964538574, 0.030103862285614014, 0.031013965606689453, 0.03192406892776489, 0.03283417224884033, 0.03374427556991577, 0.03465437889099121, 0.03556448221206665, 0.03647458553314209, 0.03738468885421753, 0.03829479217529297, 0.03920489549636841, 0.04011499881744385, 0.04102510213851929, 0.04193520545959473, 0.042845308780670166, 0.043755412101745605, 0.044665515422821045, 0.045575618743896484, 0.046485722064971924, 0.04739582538604736, 0.0483059287071228, 0.04921603202819824, 0.05012613534927368, 0.05103623867034912, 0.05194634199142456, 0.0528564453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 26.0, 119.0, 649.0, 176.0, 18.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5053959488868713, -0.48323574662208557, -0.4610755145549774, -0.43891531229019165, -0.4167550802230835, -0.39459487795829773, -0.37243467569351196, -0.3502744436264038, -0.32811424136161804, -0.3059540390968323, -0.2837938070297241, -0.26163360476493835, -0.2394733875989914, -0.21731317043304443, -0.19515296816825867, -0.1729927510023117, -0.15083253383636475, -0.12867231667041779, -0.10651210695505142, -0.08435189723968506, -0.0621916800737381, -0.04003146290779114, -0.01787126064300537, 0.004288956522941589, 0.02644917368888855, 0.04860938712954521, 0.07076960057020187, 0.09292981028556824, 0.1150900274515152, 0.13725024461746216, 0.15941044688224792, 0.18157066404819489, 0.20373082160949707, 0.22589103877544403, 0.248051255941391, 0.27021145820617676, 0.2923716902732849, 0.3145318925380707, 0.33669209480285645, 0.3588523268699646, 0.38101252913475037, 0.40317273139953613, 0.4253329634666443, 0.44749316573143005, 0.4696533679962158, 0.491813600063324, 0.5139738321304321, 0.5361340045928955, 0.5582942366600037, 0.5804544687271118, 0.6026146411895752, 0.6247748732566833, 0.6469351053237915, 0.6690952777862549, 0.691255509853363, 0.7134157419204712, 0.7355759143829346, 0.7577361464500427, 0.7798963189125061, 0.8020565509796143, 0.8242167830467224, 0.8463770151138306, 0.868537187576294, 0.8906974196434021, 0.9128576517105103]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 12.0, 27.0, 89.0, 165.0, 271.0, 231.0, 130.0, 59.0, 23.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22550296783447266, -0.20513667166233063, -0.1847703754901886, -0.16440406441688538, -0.14403776824474335, -0.12367147207260132, -0.10330516844987869, -0.08293886482715607, -0.06257256865501404, -0.04220626875758171, -0.021839968860149384, -0.0014736689627170563, 0.01889263093471527, 0.0392589271068573, 0.059625230729579926, 0.07999153435230255, 0.10035783052444458, 0.12072412669658661, 0.14109042286872864, 0.16145673394203186, 0.1818230301141739, 0.20218932628631592, 0.22255563735961914, 0.24292193353176117, 0.2632882297039032, 0.2836545407772064, 0.30402082204818726, 0.3243871331214905, 0.3447534441947937, 0.36511972546577454, 0.38548603653907776, 0.4058523178100586, 0.4262186288833618, 0.44658493995666504, 0.4669512212276459, 0.4873175323009491, 0.5076838135719299, 0.5280501246452332, 0.5484164357185364, 0.5687827467918396, 0.589148998260498, 0.6095153093338013, 0.6298816204071045, 0.6502478718757629, 0.6706141829490662, 0.6909804940223694, 0.7113468050956726, 0.7317131161689758, 0.752079427242279, 0.7724457383155823, 0.7928120493888855, 0.813178300857544, 0.8335446119308472, 0.8539109230041504, 0.8742772340774536, 0.8946435451507568, 0.9150098562240601, 0.9353761672973633, 0.9557424783706665, 0.976108729839325, 0.9964750409126282, 1.0168414115905762, 1.0372076034545898, 1.057573914527893, 1.0779402256011963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 6.0, 8.0, 10.0, 16.0, 19.0, 23.0, 30.0, 33.0, 39.0, 50.0, 46.0, 52.0, 57.0, 90.0, 1047111.0, 533.0, 64.0, 69.0, 55.0, 38.0, 35.0, 23.0, 28.0, 13.0, 17.0, 16.0, 10.0, 10.0, 10.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.17578125, -2.1163482666015625, -2.056915283203125, -1.9974822998046875, -1.93804931640625, -1.8786163330078125, -1.819183349609375, -1.7597503662109375, -1.7003173828125, -1.6408843994140625, -1.581451416015625, -1.5220184326171875, -1.46258544921875, -1.4031524658203125, -1.343719482421875, -1.2842864990234375, -1.224853515625, -1.1654205322265625, -1.105987548828125, -1.0465545654296875, -0.98712158203125, -0.9276885986328125, -0.868255615234375, -0.8088226318359375, -0.7493896484375, -0.6899566650390625, -0.630523681640625, -0.5710906982421875, -0.51165771484375, -0.4522247314453125, -0.392791748046875, -0.3333587646484375, -0.27392578125, -0.2144927978515625, -0.155059814453125, -0.0956268310546875, -0.03619384765625, 0.0232391357421875, 0.082672119140625, 0.1421051025390625, 0.2015380859375, 0.2609710693359375, 0.320404052734375, 0.3798370361328125, 0.43927001953125, 0.4987030029296875, 0.558135986328125, 0.6175689697265625, 0.677001953125, 0.7364349365234375, 0.795867919921875, 0.8553009033203125, 0.91473388671875, 0.9741668701171875, 1.033599853515625, 1.0930328369140625, 1.1524658203125, 1.2118988037109375, 1.271331787109375, 1.3307647705078125, 1.39019775390625, 1.4496307373046875, 1.509063720703125, 1.5684967041015625, 1.6279296875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [50.0, 766.0, 202.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00855255126953125, -0.0037001371383666992, 0.0011522769927978516, 0.006004691123962402, 0.010857105255126953, 0.015709519386291504, 0.020561933517456055, 0.025414347648620605, 0.030266761779785156, 0.03511917591094971, 0.03997159004211426, 0.04482400417327881, 0.04967641830444336, 0.05452883243560791, 0.05938124656677246, 0.06423366069793701, 0.06908607482910156, 0.07393848896026611, 0.07879090309143066, 0.08364331722259521, 0.08849573135375977, 0.09334814548492432, 0.09820055961608887, 0.10305297374725342, 0.10790538787841797, 0.11275780200958252, 0.11761021614074707, 0.12246263027191162, 0.12731504440307617, 0.13216745853424072, 0.13701987266540527, 0.14187228679656982, 0.14672470092773438, 0.15157711505889893, 0.15642952919006348, 0.16128194332122803, 0.16613435745239258, 0.17098677158355713, 0.17583918571472168, 0.18069159984588623, 0.18554401397705078, 0.19039642810821533, 0.19524884223937988, 0.20010125637054443, 0.20495367050170898, 0.20980608463287354, 0.21465849876403809, 0.21951091289520264, 0.2243633270263672, 0.22921574115753174, 0.2340681552886963, 0.23892056941986084, 0.2437729835510254, 0.24862539768218994, 0.2534778118133545, 0.25833022594451904, 0.2631826400756836, 0.26803505420684814, 0.2728874683380127, 0.27773988246917725, 0.2825922966003418, 0.28744471073150635, 0.2922971248626709, 0.29714953899383545, 0.302001953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 14.0, 10.0, 18.0, 23.0, 35.0, 55.0, 76.0, 139.0, 198.0, 323.0, 597.0, 1113.0, 2408.0, 5776.0, 17418.0, 65934.0, 572492.0, 310921.0, 48234.0, 13458.0, 4809.0, 2074.0, 1026.0, 559.0, 280.0, 176.0, 99.0, 80.0, 61.0, 41.0, 24.0, 20.0, 15.0, 11.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.323974609375, -0.31412506103515625, -0.3042755126953125, -0.29442596435546875, -0.284576416015625, -0.27472686767578125, -0.2648773193359375, -0.25502777099609375, -0.24517822265625, -0.23532867431640625, -0.2254791259765625, -0.21562957763671875, -0.205780029296875, -0.19593048095703125, -0.1860809326171875, -0.17623138427734375, -0.1663818359375, -0.15653228759765625, -0.1466827392578125, -0.13683319091796875, -0.126983642578125, -0.11713409423828125, -0.1072845458984375, -0.09743499755859375, -0.08758544921875, -0.07773590087890625, -0.0678863525390625, -0.05803680419921875, -0.048187255859375, -0.03833770751953125, -0.0284881591796875, -0.01863861083984375, -0.0087890625, 0.00106048583984375, 0.0109100341796875, 0.02075958251953125, 0.030609130859375, 0.04045867919921875, 0.0503082275390625, 0.06015777587890625, 0.07000732421875, 0.07985687255859375, 0.0897064208984375, 0.09955596923828125, 0.109405517578125, 0.11925506591796875, 0.1291046142578125, 0.13895416259765625, 0.1488037109375, 0.15865325927734375, 0.1685028076171875, 0.17835235595703125, 0.188201904296875, 0.19805145263671875, 0.2079010009765625, 0.21775054931640625, 0.22760009765625, 0.23744964599609375, 0.2472991943359375, 0.25714874267578125, 0.266998291015625, 0.27684783935546875, 0.2866973876953125, 0.29654693603515625, 0.306396484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 12.0, 15.0, 15.0, 18.0, 36.0, 36.0, 29.0, 40.0, 65.0, 85.0, 69.0, 68.0, 76.0, 68.0, 56.0, 59.0, 44.0, 44.0, 40.0, 20.0, 13.0, 19.0, 8.0, 12.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.263916015625, -0.25655364990234375, -0.2491912841796875, -0.24182891845703125, -0.234466552734375, -0.22710418701171875, -0.2197418212890625, -0.21237945556640625, -0.20501708984375, -0.19765472412109375, -0.1902923583984375, -0.18292999267578125, -0.175567626953125, -0.16820526123046875, -0.1608428955078125, -0.15348052978515625, -0.1461181640625, -0.13875579833984375, -0.1313934326171875, -0.12403106689453125, -0.116668701171875, -0.10930633544921875, -0.1019439697265625, -0.09458160400390625, -0.08721923828125, -0.07985687255859375, -0.0724945068359375, -0.06513214111328125, -0.057769775390625, -0.05040740966796875, -0.0430450439453125, -0.03568267822265625, -0.0283203125, -0.02095794677734375, -0.0135955810546875, -0.00623321533203125, 0.001129150390625, 0.00849151611328125, 0.0158538818359375, 0.02321624755859375, 0.03057861328125, 0.03794097900390625, 0.0453033447265625, 0.05266571044921875, 0.060028076171875, 0.06739044189453125, 0.0747528076171875, 0.08211517333984375, 0.0894775390625, 0.09683990478515625, 0.1042022705078125, 0.11156463623046875, 0.118927001953125, 0.12628936767578125, 0.1336517333984375, 0.14101409912109375, 0.14837646484375, 0.15573883056640625, 0.1631011962890625, 0.17046356201171875, 0.177825927734375, 0.18518829345703125, 0.1925506591796875, 0.19991302490234375, 0.207275390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 9.0, 22.0, 24.0, 37.0, 52.0, 85.0, 150.0, 271.0, 475.0, 1108.0, 3399.0, 15940.0, 245110.0, 739376.0, 33891.0, 5539.0, 1521.0, 663.0, 312.0, 195.0, 101.0, 80.0, 50.0, 31.0, 24.0, 18.0, 13.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.327880859375, -0.3176918029785156, -0.30750274658203125, -0.2973136901855469, -0.2871246337890625, -0.2769355773925781, -0.26674652099609375, -0.2565574645996094, -0.246368408203125, -0.23617935180664062, -0.22599029541015625, -0.21580123901367188, -0.2056121826171875, -0.19542312622070312, -0.18523406982421875, -0.17504501342773438, -0.16485595703125, -0.15466690063476562, -0.14447784423828125, -0.13428878784179688, -0.1240997314453125, -0.11391067504882812, -0.10372161865234375, -0.09353256225585938, -0.083343505859375, -0.07315444946289062, -0.06296539306640625, -0.052776336669921875, -0.0425872802734375, -0.032398223876953125, -0.02220916748046875, -0.012020111083984375, -0.0018310546875, 0.008358001708984375, 0.01854705810546875, 0.028736114501953125, 0.0389251708984375, 0.049114227294921875, 0.05930328369140625, 0.06949234008789062, 0.079681396484375, 0.08987045288085938, 0.10005950927734375, 0.11024856567382812, 0.1204376220703125, 0.13062667846679688, 0.14081573486328125, 0.15100479125976562, 0.16119384765625, 0.17138290405273438, 0.18157196044921875, 0.19176101684570312, 0.2019500732421875, 0.21213912963867188, 0.22232818603515625, 0.23251724243164062, 0.242706298828125, 0.2528953552246094, 0.26308441162109375, 0.2732734680175781, 0.2834625244140625, 0.2936515808105469, 0.30384063720703125, 0.3140296936035156, 0.32421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 10.0, 3.0, 6.0, 5.0, 7.0, 7.0, 12.0, 18.0, 20.0, 25.0, 47.0, 66.0, 96.0, 140.0, 149.0, 93.0, 76.0, 58.0, 49.0, 20.0, 19.0, 14.0, 7.0, 8.0, 11.0, 6.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002460479736328125, -0.00023922696709632874, -0.00023240596055984497, -0.0002255849540233612, -0.00021876394748687744, -0.00021194294095039368, -0.0002051219344139099, -0.00019830092787742615, -0.00019147992134094238, -0.00018465891480445862, -0.00017783790826797485, -0.0001710169017314911, -0.00016419589519500732, -0.00015737488865852356, -0.0001505538821220398, -0.00014373287558555603, -0.00013691186904907227, -0.0001300908625125885, -0.00012326985597610474, -0.00011644884943962097, -0.00010962784290313721, -0.00010280683636665344, -9.598582983016968e-05, -8.916482329368591e-05, -8.234381675720215e-05, -7.552281022071838e-05, -6.870180368423462e-05, -6.188079714775085e-05, -5.505979061126709e-05, -4.8238784074783325e-05, -4.141777753829956e-05, -3.4596771001815796e-05, -2.777576446533203e-05, -2.0954757928848267e-05, -1.4133751392364502e-05, -7.312744855880737e-06, -4.917383193969727e-07, 6.329268217086792e-06, 1.3150274753570557e-05, 1.997128129005432e-05, 2.6792287826538086e-05, 3.361329436302185e-05, 4.0434300899505615e-05, 4.725530743598938e-05, 5.4076313972473145e-05, 6.089732050895691e-05, 6.771832704544067e-05, 7.453933358192444e-05, 8.13603401184082e-05, 8.818134665489197e-05, 9.500235319137573e-05, 0.0001018233597278595, 0.00010864436626434326, 0.00011546537280082703, 0.0001222863793373108, 0.00012910738587379456, 0.00013592839241027832, 0.00014274939894676208, 0.00014957040548324585, 0.00015639141201972961, 0.00016321241855621338, 0.00017003342509269714, 0.0001768544316291809, 0.00018367543816566467, 0.00019049644470214844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 14.0, 18.0, 39.0, 31.0, 56.0, 89.0, 146.0, 254.0, 515.0, 955.0, 2237.0, 5823.0, 22359.0, 576117.0, 410045.0, 20160.0, 5572.0, 2102.0, 929.0, 446.0, 239.0, 139.0, 73.0, 59.0, 31.0, 22.0, 19.0, 6.0, 12.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.50830078125, -0.4941673278808594, -0.48003387451171875, -0.4659004211425781, -0.4517669677734375, -0.4376335144042969, -0.42350006103515625, -0.4093666076660156, -0.395233154296875, -0.3810997009277344, -0.36696624755859375, -0.3528327941894531, -0.3386993408203125, -0.3245658874511719, -0.31043243408203125, -0.2962989807128906, -0.28216552734375, -0.2680320739746094, -0.25389862060546875, -0.23976516723632812, -0.2256317138671875, -0.21149826049804688, -0.19736480712890625, -0.18323135375976562, -0.169097900390625, -0.15496444702148438, -0.14083099365234375, -0.12669754028320312, -0.1125640869140625, -0.09843063354492188, -0.08429718017578125, -0.07016372680664062, -0.0560302734375, -0.041896820068359375, -0.02776336669921875, -0.013629913330078125, 0.0005035400390625, 0.014636993408203125, 0.02877044677734375, 0.042903900146484375, 0.057037353515625, 0.07117080688476562, 0.08530426025390625, 0.09943771362304688, 0.1135711669921875, 0.12770462036132812, 0.14183807373046875, 0.15597152709960938, 0.17010498046875, 0.18423843383789062, 0.19837188720703125, 0.21250534057617188, 0.2266387939453125, 0.24077224731445312, 0.25490570068359375, 0.2690391540527344, 0.283172607421875, 0.2973060607910156, 0.31143951416015625, 0.3255729675292969, 0.3397064208984375, 0.3538398742675781, 0.36797332763671875, 0.3821067810058594, 0.396240234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 11.0, 6.0, 12.0, 15.0, 22.0, 34.0, 71.0, 248.0, 297.0, 130.0, 50.0, 25.0, 16.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.286376953125, -0.27925682067871094, -0.2721366882324219, -0.2650165557861328, -0.25789642333984375, -0.2507762908935547, -0.24365615844726562, -0.23653602600097656, -0.2294158935546875, -0.22229576110839844, -0.21517562866210938, -0.2080554962158203, -0.20093536376953125, -0.1938152313232422, -0.18669509887695312, -0.17957496643066406, -0.172454833984375, -0.16533470153808594, -0.15821456909179688, -0.1510944366455078, -0.14397430419921875, -0.1368541717529297, -0.12973403930664062, -0.12261390686035156, -0.1154937744140625, -0.10837364196777344, -0.10125350952148438, -0.09413337707519531, -0.08701324462890625, -0.07989311218261719, -0.07277297973632812, -0.06565284729003906, -0.05853271484375, -0.05141258239746094, -0.044292449951171875, -0.03717231750488281, -0.03005218505859375, -0.022932052612304688, -0.015811920166015625, -0.008691787719726562, -0.0015716552734375, 0.0055484771728515625, 0.012668609619140625, 0.019788742065429688, 0.02690887451171875, 0.03402900695800781, 0.041149139404296875, 0.04826927185058594, 0.055389404296875, 0.06250953674316406, 0.06962966918945312, 0.07674980163574219, 0.08386993408203125, 0.09099006652832031, 0.09811019897460938, 0.10523033142089844, 0.1123504638671875, 0.11947059631347656, 0.12659072875976562, 0.1337108612060547, 0.14083099365234375, 0.1479511260986328, 0.15507125854492188, 0.16219139099121094, 0.1693115234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 19.0, 42.0, 83.0, 315.0, 418.0, 90.0, 17.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587178945541382, -2.4654762744903564, -2.343773603439331, -2.2220709323883057, -2.1003682613372803, -1.9786655902862549, -1.8569629192352295, -1.735260248184204, -1.6135575771331787, -1.4918549060821533, -1.370152235031128, -1.2484495639801025, -1.1267468929290771, -1.0050442218780518, -0.8833415508270264, -0.761638879776001, -0.6399362087249756, -0.5182335376739502, -0.3965308666229248, -0.2748281955718994, -0.15312552452087402, -0.03142285346984863, 0.09027981758117676, 0.21198248863220215, 0.33368515968322754, 0.45538783073425293, 0.5770905017852783, 0.6987931728363037, 0.8204958438873291, 0.9421985149383545, 1.0639011859893799, 1.1856038570404053, 1.3073062896728516, 1.429008960723877, 1.5507116317749023, 1.6724143028259277, 1.7941169738769531, 1.9158196449279785, 2.037522315979004, 2.1592249870300293, 2.2809276580810547, 2.40263032913208, 2.5243330001831055, 2.646035671234131, 2.7677383422851562, 2.8894410133361816, 3.011143684387207, 3.1328463554382324, 3.254549026489258, 3.376251697540283, 3.4979543685913086, 3.619657039642334, 3.7413597106933594, 3.8630623817443848, 3.98476505279541, 4.1064677238464355, 4.228170394897461, 4.349873065948486, 4.471575736999512, 4.593278408050537, 4.7149810791015625, 4.836683750152588, 4.958386421203613, 5.080089092254639, 5.201791763305664]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 13.0, 14.0, 12.0, 33.0, 30.0, 38.0, 45.0, 76.0, 83.0, 70.0, 85.0, 83.0, 71.0, 59.0, 64.0, 48.0, 44.0, 41.0, 29.0, 21.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0924594402313232, -1.035036563873291, -0.977613627910614, -0.920190691947937, -0.8627678155899048, -0.8053449392318726, -0.7479220032691956, -0.6904990673065186, -0.6330761909484863, -0.5756533145904541, -0.5182303786277771, -0.4608074724674225, -0.40338456630706787, -0.34596166014671326, -0.28853875398635864, -0.23111584782600403, -0.17369294166564941, -0.1162700355052948, -0.058847129344940186, -0.0014242231845855713, 0.05599868297576904, 0.11342158913612366, 0.17084449529647827, 0.22826740145683289, 0.2856903076171875, 0.3431132137775421, 0.40053611993789673, 0.45795902609825134, 0.515381932258606, 0.5728048086166382, 0.6302277445793152, 0.6876506805419922, 0.7450735569000244, 0.8024964332580566, 0.8599193692207336, 0.9173423051834106, 0.9747651815414429, 1.032188057899475, 1.0896110534667969, 1.147033929824829, 1.2044568061828613, 1.2618796825408936, 1.3193025588989258, 1.3767255544662476, 1.4341484308242798, 1.491571307182312, 1.5489943027496338, 1.606417179107666, 1.6638400554656982, 1.7212629318237305, 1.7786858081817627, 1.8361088037490845, 1.8935316801071167, 1.950954556465149, 2.0083775520324707, 2.065800428390503, 2.123223304748535, 2.1806461811065674, 2.2380690574645996, 2.295491933822632, 2.352914810180664, 2.4103379249572754, 2.4677608013153076, 2.52518367767334, 2.582606554031372]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 35.0, 134.0, 13743.0, 4179190.0, 596.0, 237.0, 119.0, 92.0, 60.0, 36.0, 18.0, 21.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.6778488159179688, -0.4645843505859375, -0.25131988525390625, -0.038055419921875, 0.17520904541015625, 0.3884735107421875, 0.6017379760742188, 0.81500244140625, 1.0282669067382812, 1.2415313720703125, 1.4547958374023438, 1.668060302734375, 1.8813247680664062, 2.0945892333984375, 2.3078536987304688, 2.5211181640625, 2.7343826293945312, 2.9476470947265625, 3.1609115600585938, 3.374176025390625, 3.5874404907226562, 3.8007049560546875, 4.013969421386719, 4.22723388671875, 4.440498352050781, 4.6537628173828125, 4.867027282714844, 5.080291748046875, 5.293556213378906, 5.5068206787109375, 5.720085144042969, 5.933349609375, 6.146614074707031, 6.3598785400390625, 6.573143005371094, 6.786407470703125, 6.999671936035156, 7.2129364013671875, 7.426200866699219, 7.63946533203125, 7.852729797363281, 8.065994262695312, 8.279258728027344, 8.492523193359375, 8.705787658691406, 8.919052124023438, 9.132316589355469, 9.3455810546875, 9.558845520019531, 9.772109985351562, 9.985374450683594, 10.198638916015625, 10.411903381347656, 10.625167846679688, 10.838432312011719, 11.05169677734375, 11.264961242675781, 11.478225708007812, 11.691490173339844, 11.904754638671875, 12.118019104003906, 12.331283569335938, 12.544548034667969, 12.7578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 27.0, 104.0, 298.0, 351.0, 177.0, 48.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023223876953125, -0.017798900604248047, -0.012373924255371094, -0.006948947906494141, -0.0015239715576171875, 0.0039010047912597656, 0.009325981140136719, 0.014750957489013672, 0.020175933837890625, 0.025600910186767578, 0.03102588653564453, 0.036450862884521484, 0.04187583923339844, 0.04730081558227539, 0.052725791931152344, 0.0581507682800293, 0.06357574462890625, 0.0690007209777832, 0.07442569732666016, 0.07985067367553711, 0.08527565002441406, 0.09070062637329102, 0.09612560272216797, 0.10155057907104492, 0.10697555541992188, 0.11240053176879883, 0.11782550811767578, 0.12325048446655273, 0.1286754608154297, 0.13410043716430664, 0.1395254135131836, 0.14495038986206055, 0.1503753662109375, 0.15580034255981445, 0.1612253189086914, 0.16665029525756836, 0.1720752716064453, 0.17750024795532227, 0.18292522430419922, 0.18835020065307617, 0.19377517700195312, 0.19920015335083008, 0.20462512969970703, 0.21005010604858398, 0.21547508239746094, 0.2209000587463379, 0.22632503509521484, 0.2317500114440918, 0.23717498779296875, 0.2425999641418457, 0.24802494049072266, 0.2534499168395996, 0.25887489318847656, 0.2642998695373535, 0.26972484588623047, 0.2751498222351074, 0.2805747985839844, 0.28599977493286133, 0.2914247512817383, 0.29684972763061523, 0.3022747039794922, 0.30769968032836914, 0.3131246566772461, 0.31854963302612305, 0.323974609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 13.0, 16.0, 23.0, 33.0, 58.0, 89.0, 176.0, 352.0, 813.0, 2949.0, 19311.0, 4098754.0, 66214.0, 3737.0, 1010.0, 335.0, 170.0, 92.0, 62.0, 35.0, 25.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2980499267578125, -2.238677978515625, -2.1793060302734375, -2.11993408203125, -2.0605621337890625, -2.001190185546875, -1.9418182373046875, -1.8824462890625, -1.8230743408203125, -1.763702392578125, -1.7043304443359375, -1.64495849609375, -1.5855865478515625, -1.526214599609375, -1.4668426513671875, -1.407470703125, -1.3480987548828125, -1.288726806640625, -1.2293548583984375, -1.16998291015625, -1.1106109619140625, -1.051239013671875, -0.9918670654296875, -0.9324951171875, -0.8731231689453125, -0.813751220703125, -0.7543792724609375, -0.69500732421875, -0.6356353759765625, -0.576263427734375, -0.5168914794921875, -0.45751953125, -0.3981475830078125, -0.338775634765625, -0.2794036865234375, -0.22003173828125, -0.1606597900390625, -0.101287841796875, -0.0419158935546875, 0.0174560546875, 0.0768280029296875, 0.136199951171875, 0.1955718994140625, 0.25494384765625, 0.3143157958984375, 0.373687744140625, 0.4330596923828125, 0.492431640625, 0.5518035888671875, 0.611175537109375, 0.6705474853515625, 0.72991943359375, 0.7892913818359375, 0.848663330078125, 0.9080352783203125, 0.9674072265625, 1.0267791748046875, 1.086151123046875, 1.1455230712890625, 1.20489501953125, 1.2642669677734375, 1.323638916015625, 1.3830108642578125, 1.4423828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 15.0, 8.0, 16.0, 31.0, 39.0, 81.0, 158.0, 2431.0, 1116.0, 110.0, 40.0, 15.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.39052581787109375, -0.3816375732421875, -0.37274932861328125, -0.363861083984375, -0.35497283935546875, -0.3460845947265625, -0.33719635009765625, -0.32830810546875, -0.31941986083984375, -0.3105316162109375, -0.30164337158203125, -0.292755126953125, -0.28386688232421875, -0.2749786376953125, -0.26609039306640625, -0.2572021484375, -0.24831390380859375, -0.2394256591796875, -0.23053741455078125, -0.221649169921875, -0.21276092529296875, -0.2038726806640625, -0.19498443603515625, -0.18609619140625, -0.17720794677734375, -0.1683197021484375, -0.15943145751953125, -0.150543212890625, -0.14165496826171875, -0.1327667236328125, -0.12387847900390625, -0.114990234375, -0.10610198974609375, -0.0972137451171875, -0.08832550048828125, -0.079437255859375, -0.07054901123046875, -0.0616607666015625, -0.05277252197265625, -0.04388427734375, -0.03499603271484375, -0.0261077880859375, -0.01721954345703125, -0.008331298828125, 0.00055694580078125, 0.0094451904296875, 0.01833343505859375, 0.0272216796875, 0.03610992431640625, 0.0449981689453125, 0.05388641357421875, 0.062774658203125, 0.07166290283203125, 0.0805511474609375, 0.08943939208984375, 0.09832763671875, 0.10721588134765625, 0.1161041259765625, 0.12499237060546875, 0.133880615234375, 0.14276885986328125, 0.1516571044921875, 0.16054534912109375, 0.16943359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 22.0, 33.0, 79.0, 217.0, 431.0, 146.0, 42.0, 10.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462117910385132, -2.3997251987457275, -2.3373324871063232, -2.27493953704834, -2.2125468254089355, -2.1501541137695312, -2.087761402130127, -2.0253686904907227, -1.9629758596420288, -1.9005831480026245, -1.8381903171539307, -1.7757976055145264, -1.713404893875122, -1.6510120630264282, -1.588619351387024, -1.52622652053833, -1.4638338088989258, -1.4014410972595215, -1.3390482664108276, -1.2766555547714233, -1.214262843132019, -1.1518700122833252, -1.089477300643921, -1.0270845890045166, -0.9646918773651123, -0.9022991061210632, -0.8399063944816589, -0.7775136232376099, -0.7151208519935608, -0.6527280807495117, -0.5903353691101074, -0.5279425978660583, -0.4655498266220093, -0.4031570851802826, -0.3407643139362335, -0.27837157249450684, -0.21597881615161896, -0.15358605980873108, -0.0911933183670044, -0.028800547122955322, 0.03359219431877136, 0.09598495066165924, 0.15837770700454712, 0.2207704484462738, 0.2831631898880005, 0.34555596113204956, 0.40794870257377625, 0.4703414738178253, 0.532734215259552, 0.5951269865036011, 0.6575196981430054, 0.7199124693870544, 0.7823052406311035, 0.8446979522705078, 0.9070907235145569, 0.969483494758606, 1.0318762063980103, 1.0942689180374146, 1.1566617488861084, 1.2190544605255127, 1.281447172164917, 1.3438400030136108, 1.4062327146530151, 1.468625545501709, 1.5310182571411133]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 16.0, 12.0, 23.0, 20.0, 36.0, 53.0, 70.0, 84.0, 98.0, 88.0, 88.0, 69.0, 84.0, 75.0, 48.0, 43.0, 27.0, 19.0, 13.0, 12.0, 9.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2092745304107666, -1.174912691116333, -1.1405508518218994, -1.1061891317367554, -1.0718272924423218, -1.0374654531478882, -1.0031036138534546, -0.968741774559021, -0.9343799948692322, -0.9000181555747986, -0.8656563758850098, -0.8312945365905762, -0.7969326972961426, -0.7625709176063538, -0.7282090783119202, -0.6938472986221313, -0.6594854593276978, -0.6251236200332642, -0.5907618403434753, -0.5564000010490417, -0.5220382213592529, -0.48767638206481934, -0.45331454277038574, -0.41895273327827454, -0.38459092378616333, -0.3502291142940521, -0.3158673048019409, -0.2815054655075073, -0.24714365601539612, -0.2127818465232849, -0.1784200221300125, -0.1440581977367401, -0.10969632863998413, -0.07533451169729233, -0.040972694754600525, -0.006610877811908722, 0.02775093913078308, 0.06211274862289429, 0.09647457301616669, 0.1308363974094391, 0.1651982069015503, 0.1995600163936615, 0.2339218407869339, 0.2682836651802063, 0.3026454746723175, 0.3370072841644287, 0.3713691234588623, 0.4057309329509735, 0.4400927424430847, 0.4744545519351959, 0.5088163614273071, 0.5431782007217407, 0.5775400400161743, 0.6119018197059631, 0.6462636590003967, 0.6806254386901855, 0.7149872779846191, 0.7493491172790527, 0.7837108969688416, 0.8180727362632751, 0.852434515953064, 0.8867963552474976, 0.9211581945419312, 0.9555200338363647, 0.9898818135261536]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 17.0, 12.0, 19.0, 18.0, 25.0, 35.0, 29.0, 48.0, 61.0, 129.0, 572.0, 9393.0, 933074.0, 102208.0, 2281.0, 255.0, 73.0, 53.0, 41.0, 28.0, 19.0, 25.0, 16.0, 18.0, 21.0, 11.0, 9.0, 7.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6865234375, -1.6365814208984375, -1.586639404296875, -1.5366973876953125, -1.48675537109375, -1.4368133544921875, -1.386871337890625, -1.3369293212890625, -1.2869873046875, -1.2370452880859375, -1.187103271484375, -1.1371612548828125, -1.08721923828125, -1.0372772216796875, -0.987335205078125, -0.9373931884765625, -0.887451171875, -0.8375091552734375, -0.787567138671875, -0.7376251220703125, -0.68768310546875, -0.6377410888671875, -0.587799072265625, -0.5378570556640625, -0.4879150390625, -0.4379730224609375, -0.388031005859375, -0.3380889892578125, -0.28814697265625, -0.2382049560546875, -0.188262939453125, -0.1383209228515625, -0.08837890625, -0.0384368896484375, 0.011505126953125, 0.0614471435546875, 0.11138916015625, 0.1613311767578125, 0.211273193359375, 0.2612152099609375, 0.3111572265625, 0.3610992431640625, 0.411041259765625, 0.4609832763671875, 0.51092529296875, 0.5608673095703125, 0.610809326171875, 0.6607513427734375, 0.710693359375, 0.7606353759765625, 0.810577392578125, 0.8605194091796875, 0.91046142578125, 0.9604034423828125, 1.010345458984375, 1.0602874755859375, 1.1102294921875, 1.1601715087890625, 1.210113525390625, 1.2600555419921875, 1.30999755859375, 1.3599395751953125, 1.409881591796875, 1.4598236083984375, 1.509765625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 24.0, 69.0, 137.0, 283.0, 252.0, 156.0, 62.0, 22.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047149658203125, -0.04127836227416992, -0.035407066345214844, -0.029535770416259766, -0.023664474487304688, -0.01779317855834961, -0.011921882629394531, -0.006050586700439453, -0.000179290771484375, 0.005692005157470703, 0.011563301086425781, 0.01743459701538086, 0.023305892944335938, 0.029177188873291016, 0.035048484802246094, 0.04091978073120117, 0.04679107666015625, 0.05266237258911133, 0.058533668518066406, 0.06440496444702148, 0.07027626037597656, 0.07614755630493164, 0.08201885223388672, 0.0878901481628418, 0.09376144409179688, 0.09963274002075195, 0.10550403594970703, 0.11137533187866211, 0.11724662780761719, 0.12311792373657227, 0.12898921966552734, 0.13486051559448242, 0.1407318115234375, 0.14660310745239258, 0.15247440338134766, 0.15834569931030273, 0.1642169952392578, 0.1700882911682129, 0.17595958709716797, 0.18183088302612305, 0.18770217895507812, 0.1935734748840332, 0.19944477081298828, 0.20531606674194336, 0.21118736267089844, 0.21705865859985352, 0.2229299545288086, 0.22880125045776367, 0.23467254638671875, 0.24054384231567383, 0.2464151382446289, 0.252286434173584, 0.25815773010253906, 0.26402902603149414, 0.2699003219604492, 0.2757716178894043, 0.2816429138183594, 0.28751420974731445, 0.29338550567626953, 0.2992568016052246, 0.3051280975341797, 0.31099939346313477, 0.31687068939208984, 0.3227419853210449, 0.32861328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 5.0, 5.0, 7.0, 14.0, 19.0, 26.0, 23.0, 43.0, 54.0, 74.0, 89.0, 149.0, 205.0, 351.0, 639.0, 1297.0, 3724.0, 13764.0, 81292.0, 645779.0, 258087.0, 31476.0, 6928.0, 2154.0, 942.0, 478.0, 298.0, 158.0, 128.0, 80.0, 73.0, 55.0, 38.0, 28.0, 16.0, 16.0, 8.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2730865478515625, -0.262481689453125, -0.2518768310546875, -0.24127197265625, -0.2306671142578125, -0.220062255859375, -0.2094573974609375, -0.1988525390625, -0.1882476806640625, -0.177642822265625, -0.1670379638671875, -0.15643310546875, -0.1458282470703125, -0.135223388671875, -0.1246185302734375, -0.114013671875, -0.1034088134765625, -0.092803955078125, -0.0821990966796875, -0.07159423828125, -0.0609893798828125, -0.050384521484375, -0.0397796630859375, -0.0291748046875, -0.0185699462890625, -0.007965087890625, 0.0026397705078125, 0.01324462890625, 0.0238494873046875, 0.034454345703125, 0.0450592041015625, 0.0556640625, 0.0662689208984375, 0.076873779296875, 0.0874786376953125, 0.09808349609375, 0.1086883544921875, 0.119293212890625, 0.1298980712890625, 0.1405029296875, 0.1511077880859375, 0.161712646484375, 0.1723175048828125, 0.18292236328125, 0.1935272216796875, 0.204132080078125, 0.2147369384765625, 0.225341796875, 0.2359466552734375, 0.246551513671875, 0.2571563720703125, 0.26776123046875, 0.2783660888671875, 0.288970947265625, 0.2995758056640625, 0.3101806640625, 0.3207855224609375, 0.331390380859375, 0.3419952392578125, 0.35260009765625, 0.3632049560546875, 0.373809814453125, 0.3844146728515625, 0.39501953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 4.0, 8.0, 8.0, 17.0, 15.0, 13.0, 16.0, 19.0, 31.0, 44.0, 42.0, 35.0, 50.0, 47.0, 48.0, 59.0, 42.0, 57.0, 50.0, 57.0, 39.0, 50.0, 37.0, 37.0, 30.0, 19.0, 22.0, 17.0, 19.0, 11.0, 14.0, 7.0, 10.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14498138427734375, -0.1390838623046875, -0.13318634033203125, -0.127288818359375, -0.12139129638671875, -0.1154937744140625, -0.10959625244140625, -0.10369873046875, -0.09780120849609375, -0.0919036865234375, -0.08600616455078125, -0.080108642578125, -0.07421112060546875, -0.0683135986328125, -0.06241607666015625, -0.0565185546875, -0.05062103271484375, -0.0447235107421875, -0.03882598876953125, -0.032928466796875, -0.02703094482421875, -0.0211334228515625, -0.01523590087890625, -0.00933837890625, -0.00344085693359375, 0.0024566650390625, 0.00835418701171875, 0.014251708984375, 0.02014923095703125, 0.0260467529296875, 0.03194427490234375, 0.037841796875, 0.04373931884765625, 0.0496368408203125, 0.05553436279296875, 0.061431884765625, 0.06732940673828125, 0.0732269287109375, 0.07912445068359375, 0.08502197265625, 0.09091949462890625, 0.0968170166015625, 0.10271453857421875, 0.108612060546875, 0.11450958251953125, 0.1204071044921875, 0.12630462646484375, 0.1322021484375, 0.13809967041015625, 0.1439971923828125, 0.14989471435546875, 0.155792236328125, 0.16168975830078125, 0.1675872802734375, 0.17348480224609375, 0.17938232421875, 0.18527984619140625, 0.1911773681640625, 0.19707489013671875, 0.202972412109375, 0.20886993408203125, 0.2147674560546875, 0.22066497802734375, 0.2265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 16.0, 18.0, 46.0, 67.0, 152.0, 316.0, 976.0, 5618.0, 342589.0, 689270.0, 7577.0, 1149.0, 427.0, 170.0, 71.0, 30.0, 19.0, 16.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.4542884826660156, -0.43616485595703125, -0.4180412292480469, -0.3999176025390625, -0.3817939758300781, -0.36367034912109375, -0.3455467224121094, -0.327423095703125, -0.3092994689941406, -0.29117584228515625, -0.2730522155761719, -0.2549285888671875, -0.23680496215820312, -0.21868133544921875, -0.20055770874023438, -0.18243408203125, -0.16431045532226562, -0.14618682861328125, -0.12806320190429688, -0.1099395751953125, -0.09181594848632812, -0.07369232177734375, -0.055568695068359375, -0.037445068359375, -0.019321441650390625, -0.00119781494140625, 0.016925811767578125, 0.0350494384765625, 0.053173065185546875, 0.07129669189453125, 0.08942031860351562, 0.1075439453125, 0.12566757202148438, 0.14379119873046875, 0.16191482543945312, 0.1800384521484375, 0.19816207885742188, 0.21628570556640625, 0.23440933227539062, 0.252532958984375, 0.2706565856933594, 0.28878021240234375, 0.3069038391113281, 0.3250274658203125, 0.3431510925292969, 0.36127471923828125, 0.3793983459472656, 0.39752197265625, 0.4156455993652344, 0.43376922607421875, 0.4518928527832031, 0.4700164794921875, 0.4881401062011719, 0.5062637329101562, 0.5243873596191406, 0.542510986328125, 0.5606346130371094, 0.5787582397460938, 0.5968818664550781, 0.6150054931640625, 0.6331291198730469, 0.6512527465820312, 0.6693763732910156, 0.6875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 4.0, 5.0, 10.0, 34.0, 52.0, 118.0, 219.0, 256.0, 148.0, 84.0, 42.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0007457733154296875, -0.0007314775139093399, -0.0007171817123889923, -0.0007028859108686447, -0.0006885901093482971, -0.0006742943078279495, -0.0006599985063076019, -0.0006457027047872543, -0.0006314069032669067, -0.0006171111017465591, -0.0006028153002262115, -0.000588519498705864, -0.0005742236971855164, -0.0005599278956651688, -0.0005456320941448212, -0.0005313362926244736, -0.000517040491104126, -0.0005027446895837784, -0.0004884488880634308, -0.0004741530865430832, -0.0004598572850227356, -0.000445561483502388, -0.0004312656819820404, -0.0004169698804616928, -0.0004026740789413452, -0.0003883782774209976, -0.00037408247590065, -0.00035978667438030243, -0.00034549087285995483, -0.00033119507133960724, -0.00031689926981925964, -0.00030260346829891205, -0.00028830766677856445, -0.00027401186525821686, -0.00025971606373786926, -0.00024542026221752167, -0.00023112446069717407, -0.00021682865917682648, -0.00020253285765647888, -0.0001882370561361313, -0.0001739412546157837, -0.0001596454530954361, -0.0001453496515750885, -0.0001310538500547409, -0.00011675804853439331, -0.00010246224701404572, -8.816644549369812e-05, -7.387064397335052e-05, -5.957484245300293e-05, -4.5279040932655334e-05, -3.098323941230774e-05, -1.6687437891960144e-05, -2.391636371612549e-06, 1.1904165148735046e-05, 2.619996666908264e-05, 4.049576818943024e-05, 5.479156970977783e-05, 6.908737123012543e-05, 8.338317275047302e-05, 9.767897427082062e-05, 0.00011197477579116821, 0.0001262705773115158, 0.0001405663788318634, 0.000154862180352211, 0.0001691579818725586]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 7.0, 17.0, 12.0, 38.0, 47.0, 90.0, 168.0, 312.0, 764.0, 2403.0, 11244.0, 148976.0, 829740.0, 46140.0, 5955.0, 1493.0, 584.0, 240.0, 117.0, 65.0, 50.0, 30.0, 12.0, 16.0, 13.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.260498046875, -0.249786376953125, -0.23907470703125, -0.228363037109375, -0.2176513671875, -0.206939697265625, -0.19622802734375, -0.185516357421875, -0.1748046875, -0.164093017578125, -0.15338134765625, -0.142669677734375, -0.1319580078125, -0.121246337890625, -0.11053466796875, -0.099822998046875, -0.089111328125, -0.078399658203125, -0.06768798828125, -0.056976318359375, -0.0462646484375, -0.035552978515625, -0.02484130859375, -0.014129638671875, -0.00341796875, 0.007293701171875, 0.01800537109375, 0.028717041015625, 0.0394287109375, 0.050140380859375, 0.06085205078125, 0.071563720703125, 0.082275390625, 0.092987060546875, 0.10369873046875, 0.114410400390625, 0.1251220703125, 0.135833740234375, 0.14654541015625, 0.157257080078125, 0.16796875, 0.178680419921875, 0.18939208984375, 0.200103759765625, 0.2108154296875, 0.221527099609375, 0.23223876953125, 0.242950439453125, 0.253662109375, 0.264373779296875, 0.27508544921875, 0.285797119140625, 0.2965087890625, 0.307220458984375, 0.31793212890625, 0.328643798828125, 0.33935546875, 0.350067138671875, 0.36077880859375, 0.371490478515625, 0.3822021484375, 0.392913818359375, 0.40362548828125, 0.414337158203125, 0.425048828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 5.0, 7.0, 11.0, 9.0, 27.0, 61.0, 107.0, 142.0, 178.0, 171.0, 115.0, 62.0, 38.0, 20.0, 15.0, 6.0, 7.0, 2.0, 3.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1136474609375, -0.10819244384765625, -0.1027374267578125, -0.09728240966796875, -0.091827392578125, -0.08637237548828125, -0.0809173583984375, -0.07546234130859375, -0.07000732421875, -0.06455230712890625, -0.0590972900390625, -0.05364227294921875, -0.048187255859375, -0.04273223876953125, -0.0372772216796875, -0.03182220458984375, -0.0263671875, -0.02091217041015625, -0.0154571533203125, -0.01000213623046875, -0.004547119140625, 0.00090789794921875, 0.0063629150390625, 0.01181793212890625, 0.01727294921875, 0.02272796630859375, 0.0281829833984375, 0.03363800048828125, 0.039093017578125, 0.04454803466796875, 0.0500030517578125, 0.05545806884765625, 0.0609130859375, 0.06636810302734375, 0.0718231201171875, 0.07727813720703125, 0.082733154296875, 0.08818817138671875, 0.0936431884765625, 0.09909820556640625, 0.10455322265625, 0.11000823974609375, 0.1154632568359375, 0.12091827392578125, 0.126373291015625, 0.13182830810546875, 0.1372833251953125, 0.14273834228515625, 0.148193359375, 0.15364837646484375, 0.1591033935546875, 0.16455841064453125, 0.170013427734375, 0.17546844482421875, 0.1809234619140625, 0.18637847900390625, 0.19183349609375, 0.19728851318359375, 0.2027435302734375, 0.20819854736328125, 0.213653564453125, 0.21910858154296875, 0.2245635986328125, 0.23001861572265625, 0.2354736328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 20.0, 136.0, 645.0, 179.0, 22.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.646785736083984, -9.466341018676758, -9.285895347595215, -9.105450630187988, -8.925005912780762, -8.744560241699219, -8.564115524291992, -8.383670806884766, -8.203225135803223, -8.022780418395996, -7.842335224151611, -7.661890029907227, -7.481444835662842, -7.300999641418457, -7.1205549240112305, -6.940109729766846, -6.759665012359619, -6.579219818115234, -6.398775100708008, -6.218329906463623, -6.037884712219238, -5.857439994812012, -5.676994800567627, -5.496549606323242, -5.316104888916016, -5.135659694671631, -4.955214977264404, -4.7747697830200195, -4.594324588775635, -4.41387939453125, -4.233434677124023, -4.052989482879639, -3.872544765472412, -3.6920998096466064, -3.5116546154022217, -3.331209659576416, -3.1507644653320312, -2.9703195095062256, -2.78987455368042, -2.609429359436035, -2.4289841651916504, -2.2485392093658447, -2.06809401512146, -1.8876490592956543, -1.707203984260559, -1.5267589092254639, -1.3463139533996582, -1.165868878364563, -0.9854239225387573, -0.8049788475036621, -0.6245338320732117, -0.44408881664276123, -0.263643741607666, -0.0831986665725708, 0.09724628925323486, 0.2776913642883301, 0.4581364393234253, 0.6385815143585205, 0.819026529788971, 0.9994715452194214, 1.1799166202545166, 1.3603616952896118, 1.5408066511154175, 1.7212517261505127, 1.901696801185608]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 10.0, 13.0, 11.0, 10.0, 19.0, 24.0, 16.0, 24.0, 29.0, 38.0, 41.0, 44.0, 57.0, 48.0, 57.0, 67.0, 64.0, 54.0, 49.0, 48.0, 41.0, 46.0, 18.0, 37.0, 37.0, 18.0, 13.0, 19.0, 8.0, 12.0, 13.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5172576904296875, -1.4781373739242554, -1.4390170574188232, -1.3998967409133911, -1.360776424407959, -1.3216559886932373, -1.2825356721878052, -1.243415355682373, -1.204295039176941, -1.1651747226715088, -1.1260544061660767, -1.0869340896606445, -1.0478136539459229, -1.0086933374404907, -0.9695730209350586, -0.9304527044296265, -0.8913323879241943, -0.8522120714187622, -0.8130917549133301, -0.7739713788032532, -0.734851062297821, -0.6957307457923889, -0.656610369682312, -0.6174900531768799, -0.5783697366714478, -0.5392494201660156, -0.5001291036605835, -0.4610087275505066, -0.42188841104507446, -0.38276809453964233, -0.3436477482318878, -0.3045274019241333, -0.26540714502334595, -0.22628681361675262, -0.1871664822101593, -0.14804615080356598, -0.10892581939697266, -0.06980548799037933, -0.03068515658378601, 0.008435189723968506, 0.047555506229400635, 0.08667583763599396, 0.12579616904258728, 0.1649165004491806, 0.20403683185577393, 0.24315716326236725, 0.28227749466896057, 0.3213978409767151, 0.3605181574821472, 0.39963847398757935, 0.43875882029533386, 0.4778791666030884, 0.5169994831085205, 0.5561197996139526, 0.5952401161193848, 0.6343604922294617, 0.6734808087348938, 0.7126011252403259, 0.7517215013504028, 0.790841817855835, 0.8299621343612671, 0.8690824508666992, 0.9082027673721313, 0.9473231434822083, 0.9864434599876404]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 13.0, 30.0, 127.0, 590.0, 4489.0, 80867.0, 4069151.0, 34900.0, 2656.0, 531.0, 213.0, 131.0, 105.0, 87.0, 52.0, 56.0, 41.0, 33.0, 32.0, 25.0, 23.0, 21.0, 17.0, 15.0, 9.0, 12.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 6.0, 7.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.469970703125, -0.4247856140136719, -0.37960052490234375, -0.3344154357910156, -0.2892303466796875, -0.24404525756835938, -0.19886016845703125, -0.15367507934570312, -0.108489990234375, -0.06330490112304688, -0.01811981201171875, 0.027065277099609375, 0.0722503662109375, 0.11743545532226562, 0.16262054443359375, 0.20780563354492188, 0.25299072265625, 0.2981758117675781, 0.34336090087890625, 0.3885459899902344, 0.4337310791015625, 0.4789161682128906, 0.5241012573242188, 0.5692863464355469, 0.614471435546875, 0.6596565246582031, 0.7048416137695312, 0.7500267028808594, 0.7952117919921875, 0.8403968811035156, 0.8855819702148438, 0.9307670593261719, 0.9759521484375, 1.0211372375488281, 1.0663223266601562, 1.1115074157714844, 1.1566925048828125, 1.2018775939941406, 1.2470626831054688, 1.2922477722167969, 1.337432861328125, 1.3826179504394531, 1.4278030395507812, 1.4729881286621094, 1.5181732177734375, 1.5633583068847656, 1.6085433959960938, 1.6537284851074219, 1.69891357421875, 1.7440986633300781, 1.7892837524414062, 1.8344688415527344, 1.8796539306640625, 1.9248390197753906, 1.9700241088867188, 2.015209197998047, 2.060394287109375, 2.105579376220703, 2.1507644653320312, 2.1959495544433594, 2.2411346435546875, 2.2863197326660156, 2.3315048217773438, 2.376689910888672, 2.421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 12.0, 28.0, 75.0, 149.0, 219.0, 222.0, 178.0, 79.0, 36.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039459228515625, -0.03395223617553711, -0.02844524383544922, -0.022938251495361328, -0.017431259155273438, -0.011924266815185547, -0.006417274475097656, -0.0009102821350097656, 0.004596710205078125, 0.010103702545166016, 0.015610694885253906, 0.021117687225341797, 0.026624679565429688, 0.03213167190551758, 0.03763866424560547, 0.04314565658569336, 0.04865264892578125, 0.05415964126586914, 0.05966663360595703, 0.06517362594604492, 0.07068061828613281, 0.0761876106262207, 0.0816946029663086, 0.08720159530639648, 0.09270858764648438, 0.09821557998657227, 0.10372257232666016, 0.10922956466674805, 0.11473655700683594, 0.12024354934692383, 0.12575054168701172, 0.1312575340270996, 0.1367645263671875, 0.1422715187072754, 0.14777851104736328, 0.15328550338745117, 0.15879249572753906, 0.16429948806762695, 0.16980648040771484, 0.17531347274780273, 0.18082046508789062, 0.18632745742797852, 0.1918344497680664, 0.1973414421081543, 0.2028484344482422, 0.20835542678833008, 0.21386241912841797, 0.21936941146850586, 0.22487640380859375, 0.23038339614868164, 0.23589038848876953, 0.24139738082885742, 0.2469043731689453, 0.2524113655090332, 0.2579183578491211, 0.263425350189209, 0.2689323425292969, 0.27443933486938477, 0.27994632720947266, 0.28545331954956055, 0.29096031188964844, 0.29646730422973633, 0.3019742965698242, 0.3074812889099121, 0.31298828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 9.0, 21.0, 43.0, 60.0, 92.0, 334.0, 1901.0, 4156803.0, 32916.0, 1447.0, 320.0, 128.0, 73.0, 58.0, 25.0, 17.0, 15.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.131103515625, -2.00439453125, -1.877685546875, -1.7509765625, -1.624267578125, -1.49755859375, -1.370849609375, -1.244140625, -1.117431640625, -0.99072265625, -0.864013671875, -0.7373046875, -0.610595703125, -0.48388671875, -0.357177734375, -0.23046875, -0.103759765625, 0.02294921875, 0.149658203125, 0.2763671875, 0.403076171875, 0.52978515625, 0.656494140625, 0.783203125, 0.909912109375, 1.03662109375, 1.163330078125, 1.2900390625, 1.416748046875, 1.54345703125, 1.670166015625, 1.796875, 1.923583984375, 2.05029296875, 2.177001953125, 2.3037109375, 2.430419921875, 2.55712890625, 2.683837890625, 2.810546875, 2.937255859375, 3.06396484375, 3.190673828125, 3.3173828125, 3.444091796875, 3.57080078125, 3.697509765625, 3.82421875, 3.950927734375, 4.07763671875, 4.204345703125, 4.3310546875, 4.457763671875, 4.58447265625, 4.711181640625, 4.837890625, 4.964599609375, 5.09130859375, 5.218017578125, 5.3447265625, 5.471435546875, 5.59814453125, 5.724853515625, 5.8515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 5.0, 12.0, 27.0, 77.0, 908.0, 2894.0, 106.0, 26.0, 14.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086669921875, -0.07242202758789062, -0.05817413330078125, -0.043926239013671875, -0.0296783447265625, -0.015430450439453125, -0.00118255615234375, 0.013065338134765625, 0.027313232421875, 0.041561126708984375, 0.05580902099609375, 0.07005691528320312, 0.0843048095703125, 0.09855270385742188, 0.11280059814453125, 0.12704849243164062, 0.14129638671875, 0.15554428100585938, 0.16979217529296875, 0.18404006958007812, 0.1982879638671875, 0.21253585815429688, 0.22678375244140625, 0.24103164672851562, 0.255279541015625, 0.2695274353027344, 0.28377532958984375, 0.2980232238769531, 0.3122711181640625, 0.3265190124511719, 0.34076690673828125, 0.3550148010253906, 0.3692626953125, 0.3835105895996094, 0.39775848388671875, 0.4120063781738281, 0.4262542724609375, 0.4405021667480469, 0.45475006103515625, 0.4689979553222656, 0.483245849609375, 0.4974937438964844, 0.5117416381835938, 0.5259895324707031, 0.5402374267578125, 0.5544853210449219, 0.5687332153320312, 0.5829811096191406, 0.59722900390625, 0.6114768981933594, 0.6257247924804688, 0.6399726867675781, 0.6542205810546875, 0.6684684753417969, 0.6827163696289062, 0.6969642639160156, 0.711212158203125, 0.7254600524902344, 0.7397079467773438, 0.7539558410644531, 0.7682037353515625, 0.7824516296386719, 0.7966995239257812, 0.8109474182128906, 0.8251953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 19.0, 57.0, 356.0, 445.0, 80.0, 21.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3457646369934082, -1.2343119382858276, -1.122859239578247, -1.011406421661377, -0.8999537229537964, -0.7885010242462158, -0.6770482659339905, -0.5655955076217651, -0.45414280891418457, -0.3426900804042816, -0.23123735189437866, -0.11978462338447571, -0.008331894874572754, 0.10312080383300781, 0.21457356214523315, 0.3260263204574585, 0.43747901916503906, 0.5489317178726196, 0.660384476184845, 0.7718372344970703, 0.8832899332046509, 0.9947426319122314, 1.1061954498291016, 1.2176481485366821, 1.3291008472442627, 1.4405535459518433, 1.5520062446594238, 1.663459062576294, 1.7749117612838745, 1.886364459991455, 1.9978172779083252, 2.1092700958251953, 2.2207226753234863, 2.3321754932403564, 2.4436280727386475, 2.5550808906555176, 2.6665334701538086, 2.7779862880706787, 2.889439105987549, 3.00089168548584, 3.11234450340271, 3.22379732131958, 3.335249900817871, 3.446702718734741, 3.5581555366516113, 3.6696081161499023, 3.7810609340667725, 3.8925137519836426, 4.003966331481934, 4.115418910980225, 4.226871967315674, 4.338324546813965, 4.449777126312256, 4.561229705810547, 4.672682762145996, 4.784135341644287, 4.895587921142578, 5.007040500640869, 5.118493556976318, 5.229946136474609, 5.3413987159729, 5.452851295471191, 5.564304351806641, 5.675756931304932, 5.787209987640381]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 12.0, 30.0, 29.0, 62.0, 84.0, 117.0, 109.0, 134.0, 124.0, 104.0, 77.0, 49.0, 27.0, 11.0, 11.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.885972499847412, -1.822251796722412, -1.758531093597412, -1.6948102712631226, -1.6310895681381226, -1.5673688650131226, -1.503648042678833, -1.439927339553833, -1.376206636428833, -1.312485933303833, -1.248765230178833, -1.1850444078445435, -1.1213237047195435, -1.0576030015945435, -0.9938822388648987, -0.9301614761352539, -0.8664407730102539, -0.8027200698852539, -0.7389993071556091, -0.6752785444259644, -0.6115578413009644, -0.5478371381759644, -0.4841163754463196, -0.4203956425189972, -0.3566749095916748, -0.2929541766643524, -0.22923344373703003, -0.16551271080970764, -0.10179197788238525, -0.038071244955062866, 0.02564948797225952, 0.08937022089958191, 0.1530909538269043, 0.21681168675422668, 0.2805324196815491, 0.34425315260887146, 0.40797388553619385, 0.47169461846351624, 0.5354153513908386, 0.5991361141204834, 0.6628568172454834, 0.7265775203704834, 0.7902982831001282, 0.854019045829773, 0.917739748954773, 0.981460452079773, 1.0451812744140625, 1.1089019775390625, 1.1726226806640625, 1.2363433837890625, 1.3000640869140625, 1.363784909248352, 1.427505612373352, 1.491226315498352, 1.5549471378326416, 1.6186678409576416, 1.6823885440826416, 1.7461092472076416, 1.8098299503326416, 1.8735507726669312, 1.9372714757919312, 2.0009922981262207, 2.0647130012512207, 2.1284337043762207, 2.1921544075012207]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 9.0, 10.0, 19.0, 26.0, 40.0, 53.0, 109.0, 228.0, 632.0, 2974.0, 40951.0, 954392.0, 44687.0, 3194.0, 636.0, 249.0, 103.0, 73.0, 41.0, 36.0, 19.0, 16.0, 10.0, 7.0, 8.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.0378875732421875, -0.993743896484375, -0.9496002197265625, -0.90545654296875, -0.8613128662109375, -0.817169189453125, -0.7730255126953125, -0.7288818359375, -0.6847381591796875, -0.640594482421875, -0.5964508056640625, -0.55230712890625, -0.5081634521484375, -0.464019775390625, -0.4198760986328125, -0.375732421875, -0.3315887451171875, -0.287445068359375, -0.2433013916015625, -0.19915771484375, -0.1550140380859375, -0.110870361328125, -0.0667266845703125, -0.0225830078125, 0.0215606689453125, 0.065704345703125, 0.1098480224609375, 0.15399169921875, 0.1981353759765625, 0.242279052734375, 0.2864227294921875, 0.33056640625, 0.3747100830078125, 0.418853759765625, 0.4629974365234375, 0.50714111328125, 0.5512847900390625, 0.595428466796875, 0.6395721435546875, 0.6837158203125, 0.7278594970703125, 0.772003173828125, 0.8161468505859375, 0.86029052734375, 0.9044342041015625, 0.948577880859375, 0.9927215576171875, 1.036865234375, 1.0810089111328125, 1.125152587890625, 1.1692962646484375, 1.21343994140625, 1.2575836181640625, 1.301727294921875, 1.3458709716796875, 1.3900146484375, 1.4341583251953125, 1.478302001953125, 1.5224456787109375, 1.56658935546875, 1.6107330322265625, 1.654876708984375, 1.6990203857421875, 1.7431640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 18.0, 37.0, 65.0, 123.0, 158.0, 184.0, 175.0, 110.0, 72.0, 41.0, 13.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11322021484375, -0.10639286041259766, -0.09956550598144531, -0.09273815155029297, -0.08591079711914062, -0.07908344268798828, -0.07225608825683594, -0.0654287338256836, -0.05860137939453125, -0.051774024963378906, -0.04494667053222656, -0.03811931610107422, -0.031291961669921875, -0.02446460723876953, -0.017637252807617188, -0.010809898376464844, -0.0039825439453125, 0.0028448104858398438, 0.009672164916992188, 0.01649951934814453, 0.023326873779296875, 0.03015422821044922, 0.03698158264160156, 0.043808937072753906, 0.05063629150390625, 0.057463645935058594, 0.06429100036621094, 0.07111835479736328, 0.07794570922851562, 0.08477306365966797, 0.09160041809082031, 0.09842777252197266, 0.105255126953125, 0.11208248138427734, 0.11890983581542969, 0.12573719024658203, 0.13256454467773438, 0.13939189910888672, 0.14621925354003906, 0.1530466079711914, 0.15987396240234375, 0.1667013168334961, 0.17352867126464844, 0.18035602569580078, 0.18718338012695312, 0.19401073455810547, 0.2008380889892578, 0.20766544342041016, 0.2144927978515625, 0.22132015228271484, 0.2281475067138672, 0.23497486114501953, 0.24180221557617188, 0.24862957000732422, 0.25545692443847656, 0.2622842788696289, 0.26911163330078125, 0.2759389877319336, 0.28276634216308594, 0.2895936965942383, 0.2964210510253906, 0.30324840545654297, 0.3100757598876953, 0.31690311431884766, 0.32373046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 11.0, 14.0, 8.0, 19.0, 20.0, 28.0, 36.0, 56.0, 65.0, 95.0, 170.0, 315.0, 496.0, 968.0, 2170.0, 5623.0, 19488.0, 114126.0, 711974.0, 156845.0, 24687.0, 6451.0, 2372.0, 1061.0, 553.0, 319.0, 174.0, 114.0, 67.0, 68.0, 32.0, 28.0, 16.0, 18.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.449951171875, -0.435699462890625, -0.42144775390625, -0.407196044921875, -0.3929443359375, -0.378692626953125, -0.36444091796875, -0.350189208984375, -0.3359375, -0.321685791015625, -0.30743408203125, -0.293182373046875, -0.2789306640625, -0.264678955078125, -0.25042724609375, -0.236175537109375, -0.221923828125, -0.207672119140625, -0.19342041015625, -0.179168701171875, -0.1649169921875, -0.150665283203125, -0.13641357421875, -0.122161865234375, -0.10791015625, -0.093658447265625, -0.07940673828125, -0.065155029296875, -0.0509033203125, -0.036651611328125, -0.02239990234375, -0.008148193359375, 0.006103515625, 0.020355224609375, 0.03460693359375, 0.048858642578125, 0.0631103515625, 0.077362060546875, 0.09161376953125, 0.105865478515625, 0.1201171875, 0.134368896484375, 0.14862060546875, 0.162872314453125, 0.1771240234375, 0.191375732421875, 0.20562744140625, 0.219879150390625, 0.234130859375, 0.248382568359375, 0.26263427734375, 0.276885986328125, 0.2911376953125, 0.305389404296875, 0.31964111328125, 0.333892822265625, 0.34814453125, 0.362396240234375, 0.37664794921875, 0.390899658203125, 0.4051513671875, 0.419403076171875, 0.43365478515625, 0.447906494140625, 0.462158203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 17.0, 14.0, 20.0, 20.0, 35.0, 36.0, 40.0, 42.0, 63.0, 64.0, 64.0, 63.0, 70.0, 65.0, 69.0, 51.0, 46.0, 43.0, 38.0, 22.0, 26.0, 21.0, 18.0, 6.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.376220703125, -0.36444854736328125, -0.3526763916015625, -0.34090423583984375, -0.329132080078125, -0.31735992431640625, -0.3055877685546875, -0.29381561279296875, -0.28204345703125, -0.27027130126953125, -0.2584991455078125, -0.24672698974609375, -0.234954833984375, -0.22318267822265625, -0.2114105224609375, -0.19963836669921875, -0.1878662109375, -0.17609405517578125, -0.1643218994140625, -0.15254974365234375, -0.140777587890625, -0.12900543212890625, -0.1172332763671875, -0.10546112060546875, -0.09368896484375, -0.08191680908203125, -0.0701446533203125, -0.05837249755859375, -0.046600341796875, -0.03482818603515625, -0.0230560302734375, -0.01128387451171875, 0.00048828125, 0.01226043701171875, 0.0240325927734375, 0.03580474853515625, 0.047576904296875, 0.05934906005859375, 0.0711212158203125, 0.08289337158203125, 0.09466552734375, 0.10643768310546875, 0.1182098388671875, 0.12998199462890625, 0.141754150390625, 0.15352630615234375, 0.1652984619140625, 0.17707061767578125, 0.1888427734375, 0.20061492919921875, 0.2123870849609375, 0.22415924072265625, 0.235931396484375, 0.24770355224609375, 0.2594757080078125, 0.27124786376953125, 0.28302001953125, 0.29479217529296875, 0.3065643310546875, 0.31833648681640625, 0.330108642578125, 0.34188079833984375, 0.3536529541015625, 0.36542510986328125, 0.377197265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 17.0, 15.0, 16.0, 20.0, 34.0, 63.0, 90.0, 162.0, 234.0, 505.0, 1164.0, 3032.0, 8804.0, 35771.0, 296613.0, 597271.0, 81599.0, 15035.0, 4695.0, 1705.0, 772.0, 367.0, 198.0, 97.0, 66.0, 50.0, 41.0, 14.0, 22.0, 11.0, 10.0, 9.0, 10.0, 9.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.15033531188964844, -0.14551925659179688, -0.1407032012939453, -0.13588714599609375, -0.1310710906982422, -0.12625503540039062, -0.12143898010253906, -0.1166229248046875, -0.11180686950683594, -0.10699081420898438, -0.10217475891113281, -0.09735870361328125, -0.09254264831542969, -0.08772659301757812, -0.08291053771972656, -0.078094482421875, -0.07327842712402344, -0.06846237182617188, -0.06364631652832031, -0.05883026123046875, -0.05401420593261719, -0.049198150634765625, -0.04438209533691406, -0.0395660400390625, -0.03474998474121094, -0.029933929443359375, -0.025117874145507812, -0.02030181884765625, -0.015485763549804688, -0.010669708251953125, -0.0058536529541015625, -0.00103759765625, 0.0037784576416015625, 0.008594512939453125, 0.013410568237304688, 0.01822662353515625, 0.023042678833007812, 0.027858734130859375, 0.03267478942871094, 0.0374908447265625, 0.04230690002441406, 0.047122955322265625, 0.05193901062011719, 0.05675506591796875, 0.06157112121582031, 0.06638717651367188, 0.07120323181152344, 0.076019287109375, 0.08083534240722656, 0.08565139770507812, 0.09046745300292969, 0.09528350830078125, 0.10009956359863281, 0.10491561889648438, 0.10973167419433594, 0.1145477294921875, 0.11936378479003906, 0.12417984008789062, 0.1289958953857422, 0.13381195068359375, 0.1386280059814453, 0.14344406127929688, 0.14826011657714844, 0.153076171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 18.0, 14.0, 17.0, 26.0, 32.0, 55.0, 32.0, 51.0, 74.0, 82.0, 91.0, 105.0, 64.0, 67.0, 53.0, 43.0, 38.0, 26.0, 26.0, 19.0, 14.0, 13.0, 10.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00016570091247558594, -0.00016160588711500168, -0.00015751086175441742, -0.00015341583639383316, -0.0001493208110332489, -0.00014522578567266464, -0.00014113076031208038, -0.00013703573495149612, -0.00013294070959091187, -0.0001288456842303276, -0.00012475065886974335, -0.00012065563350915909, -0.00011656060814857483, -0.00011246558278799057, -0.00010837055742740631, -0.00010427553206682205, -0.00010018050670623779, -9.608548134565353e-05, -9.199045598506927e-05, -8.789543062448502e-05, -8.380040526390076e-05, -7.97053799033165e-05, -7.561035454273224e-05, -7.151532918214798e-05, -6.742030382156372e-05, -6.332527846097946e-05, -5.92302531003952e-05, -5.5135227739810944e-05, -5.1040202379226685e-05, -4.6945177018642426e-05, -4.2850151658058167e-05, -3.875512629747391e-05, -3.466010093688965e-05, -3.056507557630539e-05, -2.647005021572113e-05, -2.237502485513687e-05, -1.8279999494552612e-05, -1.4184974133968353e-05, -1.0089948773384094e-05, -5.994923412799835e-06, -1.8998980522155762e-06, 2.195127308368683e-06, 6.290152668952942e-06, 1.0385178029537201e-05, 1.448020339012146e-05, 1.857522875070572e-05, 2.2670254111289978e-05, 2.6765279471874237e-05, 3.0860304832458496e-05, 3.4955330193042755e-05, 3.9050355553627014e-05, 4.314538091421127e-05, 4.724040627479553e-05, 5.133543163537979e-05, 5.543045699596405e-05, 5.952548235654831e-05, 6.362050771713257e-05, 6.771553307771683e-05, 7.181055843830109e-05, 7.590558379888535e-05, 8.00006091594696e-05, 8.409563452005386e-05, 8.819065988063812e-05, 9.228568524122238e-05, 9.638071060180664e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 6.0, 3.0, 17.0, 18.0, 25.0, 34.0, 63.0, 75.0, 162.0, 313.0, 711.0, 1804.0, 5311.0, 21146.0, 230386.0, 704729.0, 67817.0, 10672.0, 3090.0, 1160.0, 458.0, 209.0, 140.0, 80.0, 47.0, 25.0, 9.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1578693389892578, -0.15228652954101562, -0.14670372009277344, -0.14112091064453125, -0.13553810119628906, -0.12995529174804688, -0.12437248229980469, -0.1187896728515625, -0.11320686340332031, -0.10762405395507812, -0.10204124450683594, -0.09645843505859375, -0.09087562561035156, -0.08529281616210938, -0.07971000671386719, -0.074127197265625, -0.06854438781738281, -0.06296157836914062, -0.05737876892089844, -0.05179595947265625, -0.04621315002441406, -0.040630340576171875, -0.03504753112792969, -0.0294647216796875, -0.023881912231445312, -0.018299102783203125, -0.012716293334960938, -0.00713348388671875, -0.0015506744384765625, 0.004032135009765625, 0.009614944458007812, 0.01519775390625, 0.020780563354492188, 0.026363372802734375, 0.03194618225097656, 0.03752899169921875, 0.04311180114746094, 0.048694610595703125, 0.05427742004394531, 0.0598602294921875, 0.06544303894042969, 0.07102584838867188, 0.07660865783691406, 0.08219146728515625, 0.08777427673339844, 0.09335708618164062, 0.09893989562988281, 0.104522705078125, 0.11010551452636719, 0.11568832397460938, 0.12127113342285156, 0.12685394287109375, 0.13243675231933594, 0.13801956176757812, 0.1436023712158203, 0.1491851806640625, 0.1547679901123047, 0.16035079956054688, 0.16593360900878906, 0.17151641845703125, 0.17709922790527344, 0.18268203735351562, 0.1882648468017578, 0.19384765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 11.0, 15.0, 29.0, 35.0, 58.0, 108.0, 138.0, 147.0, 130.0, 108.0, 80.0, 57.0, 25.0, 18.0, 12.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08619022369384766, -0.08235359191894531, -0.07851696014404297, -0.07468032836914062, -0.07084369659423828, -0.06700706481933594, -0.0631704330444336, -0.05933380126953125, -0.055497169494628906, -0.05166053771972656, -0.04782390594482422, -0.043987274169921875, -0.04015064239501953, -0.03631401062011719, -0.032477378845214844, -0.0286407470703125, -0.024804115295410156, -0.020967483520507812, -0.01713085174560547, -0.013294219970703125, -0.009457588195800781, -0.0056209564208984375, -0.0017843246459960938, 0.00205230712890625, 0.005888938903808594, 0.009725570678710938, 0.013562202453613281, 0.017398834228515625, 0.02123546600341797, 0.025072097778320312, 0.028908729553222656, 0.032745361328125, 0.036581993103027344, 0.04041862487792969, 0.04425525665283203, 0.048091888427734375, 0.05192852020263672, 0.05576515197753906, 0.059601783752441406, 0.06343841552734375, 0.0672750473022461, 0.07111167907714844, 0.07494831085205078, 0.07878494262695312, 0.08262157440185547, 0.08645820617675781, 0.09029483795166016, 0.0941314697265625, 0.09796810150146484, 0.10180473327636719, 0.10564136505126953, 0.10947799682617188, 0.11331462860107422, 0.11715126037597656, 0.1209878921508789, 0.12482452392578125, 0.1286611557006836, 0.13249778747558594, 0.13633441925048828, 0.14017105102539062, 0.14400768280029297, 0.1478443145751953, 0.15168094635009766, 0.155517578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 7.0, 25.0, 77.0, 189.0, 383.0, 218.0, 59.0, 26.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.911895275115967, -2.7886033058166504, -2.665311336517334, -2.5420193672180176, -2.4187276363372803, -2.295435667037964, -2.1721436977386475, -2.048851728439331, -1.9255597591400146, -1.8022677898406982, -1.6789759397506714, -1.555683970451355, -1.4323920011520386, -1.3091001510620117, -1.1858081817626953, -1.062516212463379, -0.939224362373352, -0.8159324526786804, -0.692640483379364, -0.5693485736846924, -0.44605663418769836, -0.32276469469070435, -0.19947278499603271, -0.07618081569671631, 0.04711109399795532, 0.17040303349494934, 0.29369497299194336, 0.416986882686615, 0.5402787923812866, 0.663570761680603, 0.7868626713752747, 0.9101546406745911, 1.0334465503692627, 1.156738519668579, 1.280030369758606, 1.4033223390579224, 1.5266143083572388, 1.6499061584472656, 1.773198127746582, 1.8964900970458984, 2.019782066345215, 2.1430740356445312, 2.2663660049438477, 2.389657974243164, 2.5129497051239014, 2.6362416744232178, 2.759533643722534, 2.8828256130218506, 3.006117343902588, 3.1294093132019043, 3.2527012825012207, 3.375993251800537, 3.4992849826812744, 3.622576951980591, 3.7458689212799072, 3.8691608905792236, 3.99245285987854, 4.115744590759277, 4.239036560058594, 4.36232852935791, 4.485620498657227, 4.608912467956543, 4.732204437255859, 4.855496406555176, 4.978788375854492]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 7.0, 8.0, 6.0, 16.0, 19.0, 17.0, 15.0, 29.0, 29.0, 35.0, 39.0, 39.0, 51.0, 43.0, 53.0, 42.0, 74.0, 54.0, 46.0, 50.0, 54.0, 40.0, 37.0, 27.0, 33.0, 30.0, 29.0, 18.0, 11.0, 10.0, 13.0, 11.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4132628440856934, -1.359816074371338, -1.3063693046569824, -1.252922534942627, -1.199475884437561, -1.1460291147232056, -1.09258234500885, -1.0391355752944946, -0.9856888055801392, -0.9322420358657837, -0.878795325756073, -0.8253485560417175, -0.7719017863273621, -0.7184550762176514, -0.6650083065032959, -0.6115615367889404, -0.5581148266792297, -0.5046680569648743, -0.4512213170528412, -0.3977745771408081, -0.34432780742645264, -0.29088106751441956, -0.23743432760238647, -0.183987557888031, -0.13054081797599792, -0.07709406316280365, -0.023647315800189972, 0.029799431562423706, 0.08324618637561798, 0.13669294118881226, 0.19013968110084534, 0.2435864508152008, 0.2970331907272339, 0.35047993063926697, 0.40392670035362244, 0.4573734402656555, 0.510820209980011, 0.5642669200897217, 0.6177136898040771, 0.6711604595184326, 0.7246072292327881, 0.7780539989471436, 0.8315007090568542, 0.8849474787712097, 0.9383942484855652, 0.9918409585952759, 1.0452877283096313, 1.0987344980239868, 1.1521811485290527, 1.2056279182434082, 1.2590746879577637, 1.3125214576721191, 1.365968108177185, 1.4194148778915405, 1.472861647605896, 1.5263084173202515, 1.579755187034607, 1.6332019567489624, 1.6866487264633179, 1.7400953769683838, 1.7935421466827393, 1.8469889163970947, 1.9004356861114502, 1.9538824558258057, 2.007329225540161]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 4.0, 19.0, 19.0, 27.0, 75.0, 146.0, 375.0, 923.0, 3046.0, 15142.0, 243294.0, 3888614.0, 34492.0, 5147.0, 1379.0, 591.0, 285.0, 181.0, 120.0, 90.0, 70.0, 41.0, 36.0, 23.0, 16.0, 24.0, 15.0, 16.0, 12.0, 12.0, 8.0, 3.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.465087890625, -0.4345054626464844, -0.40392303466796875, -0.3733406066894531, -0.3427581787109375, -0.3121757507324219, -0.28159332275390625, -0.2510108947753906, -0.220428466796875, -0.18984603881835938, -0.15926361083984375, -0.12868118286132812, -0.0980987548828125, -0.06751632690429688, -0.03693389892578125, -0.006351470947265625, 0.02423095703125, 0.054813385009765625, 0.08539581298828125, 0.11597824096679688, 0.1465606689453125, 0.17714309692382812, 0.20772552490234375, 0.23830795288085938, 0.268890380859375, 0.2994728088378906, 0.33005523681640625, 0.3606376647949219, 0.3912200927734375, 0.4218025207519531, 0.45238494873046875, 0.4829673767089844, 0.5135498046875, 0.5441322326660156, 0.5747146606445312, 0.6052970886230469, 0.6358795166015625, 0.6664619445800781, 0.6970443725585938, 0.7276268005371094, 0.758209228515625, 0.7887916564941406, 0.8193740844726562, 0.8499565124511719, 0.8805389404296875, 0.9111213684082031, 0.9417037963867188, 0.9722862243652344, 1.00286865234375, 1.0334510803222656, 1.0640335083007812, 1.0946159362792969, 1.1251983642578125, 1.1557807922363281, 1.1863632202148438, 1.2169456481933594, 1.247528076171875, 1.2781105041503906, 1.3086929321289062, 1.3392753601074219, 1.3698577880859375, 1.4004402160644531, 1.4310226440429688, 1.4616050720214844, 1.4921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 21.0, 37.0, 60.0, 125.0, 139.0, 168.0, 164.0, 128.0, 77.0, 48.0, 20.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083251953125, -0.07669448852539062, -0.07013702392578125, -0.06357955932617188, -0.0570220947265625, -0.050464630126953125, -0.04390716552734375, -0.037349700927734375, -0.030792236328125, -0.024234771728515625, -0.01767730712890625, -0.011119842529296875, -0.0045623779296875, 0.001995086669921875, 0.00855255126953125, 0.015110015869140625, 0.02166748046875, 0.028224945068359375, 0.03478240966796875, 0.041339874267578125, 0.0478973388671875, 0.054454803466796875, 0.06101226806640625, 0.06756973266601562, 0.074127197265625, 0.08068466186523438, 0.08724212646484375, 0.09379959106445312, 0.1003570556640625, 0.10691452026367188, 0.11347198486328125, 0.12002944946289062, 0.1265869140625, 0.13314437866210938, 0.13970184326171875, 0.14625930786132812, 0.1528167724609375, 0.15937423706054688, 0.16593170166015625, 0.17248916625976562, 0.179046630859375, 0.18560409545898438, 0.19216156005859375, 0.19871902465820312, 0.2052764892578125, 0.21183395385742188, 0.21839141845703125, 0.22494888305664062, 0.23150634765625, 0.23806381225585938, 0.24462127685546875, 0.2511787414550781, 0.2577362060546875, 0.2642936706542969, 0.27085113525390625, 0.2774085998535156, 0.283966064453125, 0.2905235290527344, 0.29708099365234375, 0.3036384582519531, 0.3101959228515625, 0.3167533874511719, 0.32331085205078125, 0.3298683166503906, 0.33642578125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 17.0, 28.0, 37.0, 85.0, 141.0, 307.0, 629.0, 2103.0, 19959.0, 4148945.0, 18391.0, 2170.0, 752.0, 355.0, 159.0, 89.0, 40.0, 36.0, 8.0, 11.0, 6.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4443359375, -1.395355224609375, -1.34637451171875, -1.297393798828125, -1.2484130859375, -1.199432373046875, -1.15045166015625, -1.101470947265625, -1.052490234375, -1.003509521484375, -0.95452880859375, -0.905548095703125, -0.8565673828125, -0.807586669921875, -0.75860595703125, -0.709625244140625, -0.66064453125, -0.611663818359375, -0.56268310546875, -0.513702392578125, -0.4647216796875, -0.415740966796875, -0.36676025390625, -0.317779541015625, -0.268798828125, -0.219818115234375, -0.17083740234375, -0.121856689453125, -0.0728759765625, -0.023895263671875, 0.02508544921875, 0.074066162109375, 0.123046875, 0.172027587890625, 0.22100830078125, 0.269989013671875, 0.3189697265625, 0.367950439453125, 0.41693115234375, 0.465911865234375, 0.514892578125, 0.563873291015625, 0.61285400390625, 0.661834716796875, 0.7108154296875, 0.759796142578125, 0.80877685546875, 0.857757568359375, 0.90673828125, 0.955718994140625, 1.00469970703125, 1.053680419921875, 1.1026611328125, 1.151641845703125, 1.20062255859375, 1.249603271484375, 1.298583984375, 1.347564697265625, 1.39654541015625, 1.445526123046875, 1.4945068359375, 1.543487548828125, 1.59246826171875, 1.641448974609375, 1.6904296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 8.0, 3.0, 6.0, 17.0, 54.0, 237.0, 2769.0, 794.0, 111.0, 38.0, 17.0, 11.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.220703125, -0.2121429443359375, -0.203582763671875, -0.1950225830078125, -0.18646240234375, -0.1779022216796875, -0.169342041015625, -0.1607818603515625, -0.1522216796875, -0.1436614990234375, -0.135101318359375, -0.1265411376953125, -0.11798095703125, -0.1094207763671875, -0.100860595703125, -0.0923004150390625, -0.083740234375, -0.0751800537109375, -0.066619873046875, -0.0580596923828125, -0.04949951171875, -0.0409393310546875, -0.032379150390625, -0.0238189697265625, -0.0152587890625, -0.0066986083984375, 0.001861572265625, 0.0104217529296875, 0.01898193359375, 0.0275421142578125, 0.036102294921875, 0.0446624755859375, 0.05322265625, 0.0617828369140625, 0.070343017578125, 0.0789031982421875, 0.08746337890625, 0.0960235595703125, 0.104583740234375, 0.1131439208984375, 0.1217041015625, 0.1302642822265625, 0.138824462890625, 0.1473846435546875, 0.15594482421875, 0.1645050048828125, 0.173065185546875, 0.1816253662109375, 0.190185546875, 0.1987457275390625, 0.207305908203125, 0.2158660888671875, 0.22442626953125, 0.2329864501953125, 0.241546630859375, 0.2501068115234375, 0.2586669921875, 0.2672271728515625, 0.275787353515625, 0.2843475341796875, 0.29290771484375, 0.3014678955078125, 0.310028076171875, 0.3185882568359375, 0.3271484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 10.0, 60.0, 338.0, 464.0, 91.0, 25.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.004013776779175, -2.925145149230957, -2.8462765216827393, -2.7674078941345215, -2.6885392665863037, -2.609670639038086, -2.530802011489868, -2.4519333839416504, -2.3730649948120117, -2.294196367263794, -2.215327739715576, -2.1364591121673584, -2.0575904846191406, -1.9787218570709229, -1.8998533487319946, -1.8209847211837769, -1.7421159744262695, -1.6632473468780518, -1.584378719329834, -1.5055100917816162, -1.4266414642333984, -1.3477728366851807, -1.2689043283462524, -1.1900357007980347, -1.111167073249817, -1.0322984457015991, -0.9534298181533813, -0.8745612502098083, -0.7956926226615906, -0.7168239951133728, -0.6379554271697998, -0.559086799621582, -0.48021793365478516, -0.4013493061065674, -0.322480708360672, -0.24361209571361542, -0.16474348306655884, -0.08587485551834106, -0.007006257772445679, 0.07186233997344971, 0.15073096752166748, 0.22959958016872406, 0.30846819281578064, 0.387336790561676, 0.4662054181098938, 0.5450740456581116, 0.6239426136016846, 0.7028112411499023, 0.7816798686981201, 0.8605484962463379, 0.9394171237945557, 1.0182857513427734, 1.0971543788909912, 1.176023006439209, 1.2548915147781372, 1.333760142326355, 1.4126287698745728, 1.4914973974227905, 1.5703660249710083, 1.649234652519226, 1.7281031608581543, 1.806971788406372, 1.8858404159545898, 1.9647090435028076, 2.0435776710510254]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 11.0, 1.0, 11.0, 7.0, 18.0, 17.0, 32.0, 46.0, 48.0, 55.0, 55.0, 78.0, 66.0, 66.0, 68.0, 71.0, 62.0, 55.0, 48.0, 45.0, 40.0, 18.0, 25.0, 16.0, 15.0, 12.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6948535442352295, -0.6740829348564148, -0.6533122658729553, -0.6325416564941406, -0.6117710471153259, -0.5910004377365112, -0.5702297687530518, -0.5494591593742371, -0.5286885499954224, -0.5079179406166077, -0.4871473014354706, -0.4663766622543335, -0.4456060528755188, -0.4248354136943817, -0.40406477451324463, -0.38329416513442993, -0.36252349615097046, -0.3417528569698334, -0.3209822475910187, -0.3002116084098816, -0.2794409990310669, -0.2586703598499298, -0.23789972066879272, -0.21712909638881683, -0.19635847210884094, -0.17558784782886505, -0.15481722354888916, -0.13404658436775208, -0.11327596008777618, -0.09250533580780029, -0.0717347040772438, -0.05096407234668732, -0.030193448066711426, -0.009422820061445236, 0.011347807943820953, 0.03211843594908714, 0.05288906395435333, 0.07365968823432922, 0.09443031996488571, 0.1152009516954422, 0.1359715759754181, 0.15674220025539398, 0.17751282453536987, 0.19828346371650696, 0.21905408799648285, 0.23982471227645874, 0.2605953514575958, 0.2813659906387329, 0.3021366000175476, 0.3229072391986847, 0.3436778485774994, 0.3644484877586365, 0.38521909713745117, 0.40598973631858826, 0.42676037549972534, 0.44753098487854004, 0.4683016240596771, 0.4890722632408142, 0.5098428726196289, 0.5306134819984436, 0.5513841509819031, 0.5721547603607178, 0.5929253697395325, 0.6136960387229919, 0.6344666481018066]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 13.0, 24.0, 20.0, 39.0, 45.0, 97.0, 186.0, 422.0, 1227.0, 5814.0, 148310.0, 866920.0, 21686.0, 2471.0, 715.0, 256.0, 121.0, 54.0, 41.0, 36.0, 16.0, 13.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.56640625, -1.52545166015625, -1.4844970703125, -1.44354248046875, -1.402587890625, -1.36163330078125, -1.3206787109375, -1.27972412109375, -1.23876953125, -1.19781494140625, -1.1568603515625, -1.11590576171875, -1.074951171875, -1.03399658203125, -0.9930419921875, -0.95208740234375, -0.9111328125, -0.87017822265625, -0.8292236328125, -0.78826904296875, -0.747314453125, -0.70635986328125, -0.6654052734375, -0.62445068359375, -0.58349609375, -0.54254150390625, -0.5015869140625, -0.46063232421875, -0.419677734375, -0.37872314453125, -0.3377685546875, -0.29681396484375, -0.255859375, -0.21490478515625, -0.1739501953125, -0.13299560546875, -0.092041015625, -0.05108642578125, -0.0101318359375, 0.03082275390625, 0.07177734375, 0.11273193359375, 0.1536865234375, 0.19464111328125, 0.235595703125, 0.27655029296875, 0.3175048828125, 0.35845947265625, 0.3994140625, 0.44036865234375, 0.4813232421875, 0.52227783203125, 0.563232421875, 0.60418701171875, 0.6451416015625, 0.68609619140625, 0.72705078125, 0.76800537109375, 0.8089599609375, 0.84991455078125, 0.890869140625, 0.93182373046875, 0.9727783203125, 1.01373291015625, 1.0546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 9.0, 16.0, 37.0, 58.0, 78.0, 121.0, 128.0, 150.0, 135.0, 108.0, 78.0, 38.0, 25.0, 11.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08734130859375, -0.08079242706298828, -0.07424354553222656, -0.06769466400146484, -0.061145782470703125, -0.054596900939941406, -0.04804801940917969, -0.04149913787841797, -0.03495025634765625, -0.02840137481689453, -0.021852493286132812, -0.015303611755371094, -0.008754730224609375, -0.0022058486938476562, 0.0043430328369140625, 0.010891914367675781, 0.0174407958984375, 0.02398967742919922, 0.030538558959960938, 0.037087440490722656, 0.043636322021484375, 0.050185203552246094, 0.05673408508300781, 0.06328296661376953, 0.06983184814453125, 0.07638072967529297, 0.08292961120605469, 0.0894784927368164, 0.09602737426757812, 0.10257625579833984, 0.10912513732910156, 0.11567401885986328, 0.122222900390625, 0.12877178192138672, 0.13532066345214844, 0.14186954498291016, 0.14841842651367188, 0.1549673080444336, 0.1615161895751953, 0.16806507110595703, 0.17461395263671875, 0.18116283416748047, 0.1877117156982422, 0.1942605972290039, 0.20080947875976562, 0.20735836029052734, 0.21390724182128906, 0.22045612335205078, 0.2270050048828125, 0.23355388641357422, 0.24010276794433594, 0.24665164947509766, 0.2532005310058594, 0.2597494125366211, 0.2662982940673828, 0.27284717559814453, 0.27939605712890625, 0.28594493865966797, 0.2924938201904297, 0.2990427017211914, 0.3055915832519531, 0.31214046478271484, 0.31868934631347656, 0.3252382278442383, 0.331787109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 11.0, 9.0, 15.0, 25.0, 32.0, 50.0, 94.0, 185.0, 401.0, 927.0, 2265.0, 7543.0, 47571.0, 770289.0, 195701.0, 16908.0, 3930.0, 1325.0, 582.0, 291.0, 163.0, 77.0, 41.0, 32.0, 27.0, 18.0, 10.0, 7.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5313262939453125, -0.507965087890625, -0.4846038818359375, -0.46124267578125, -0.4378814697265625, -0.414520263671875, -0.3911590576171875, -0.3677978515625, -0.3444366455078125, -0.321075439453125, -0.2977142333984375, -0.27435302734375, -0.2509918212890625, -0.227630615234375, -0.2042694091796875, -0.180908203125, -0.1575469970703125, -0.134185791015625, -0.1108245849609375, -0.08746337890625, -0.0641021728515625, -0.040740966796875, -0.0173797607421875, 0.0059814453125, 0.0293426513671875, 0.052703857421875, 0.0760650634765625, 0.09942626953125, 0.1227874755859375, 0.146148681640625, 0.1695098876953125, 0.19287109375, 0.2162322998046875, 0.239593505859375, 0.2629547119140625, 0.28631591796875, 0.3096771240234375, 0.333038330078125, 0.3563995361328125, 0.3797607421875, 0.4031219482421875, 0.426483154296875, 0.4498443603515625, 0.47320556640625, 0.4965667724609375, 0.519927978515625, 0.5432891845703125, 0.566650390625, 0.5900115966796875, 0.613372802734375, 0.6367340087890625, 0.66009521484375, 0.6834564208984375, 0.706817626953125, 0.7301788330078125, 0.7535400390625, 0.7769012451171875, 0.800262451171875, 0.8236236572265625, 0.84698486328125, 0.8703460693359375, 0.893707275390625, 0.9170684814453125, 0.9404296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 14.0, 10.0, 16.0, 21.0, 36.0, 44.0, 55.0, 78.0, 84.0, 77.0, 98.0, 96.0, 71.0, 48.0, 50.0, 43.0, 40.0, 27.0, 19.0, 23.0, 10.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4638671875, -0.44628143310546875, -0.4286956787109375, -0.41110992431640625, -0.393524169921875, -0.37593841552734375, -0.3583526611328125, -0.34076690673828125, -0.32318115234375, -0.30559539794921875, -0.2880096435546875, -0.27042388916015625, -0.252838134765625, -0.23525238037109375, -0.2176666259765625, -0.20008087158203125, -0.1824951171875, -0.16490936279296875, -0.1473236083984375, -0.12973785400390625, -0.112152099609375, -0.09456634521484375, -0.0769805908203125, -0.05939483642578125, -0.04180908203125, -0.02422332763671875, -0.0066375732421875, 0.01094818115234375, 0.028533935546875, 0.04611968994140625, 0.0637054443359375, 0.08129119873046875, 0.098876953125, 0.11646270751953125, 0.1340484619140625, 0.15163421630859375, 0.169219970703125, 0.18680572509765625, 0.2043914794921875, 0.22197723388671875, 0.23956298828125, 0.25714874267578125, 0.2747344970703125, 0.29232025146484375, 0.309906005859375, 0.32749176025390625, 0.3450775146484375, 0.36266326904296875, 0.3802490234375, 0.39783477783203125, 0.4154205322265625, 0.43300628662109375, 0.450592041015625, 0.46817779541015625, 0.4857635498046875, 0.5033493041992188, 0.52093505859375, 0.5385208129882812, 0.5561065673828125, 0.5736923217773438, 0.591278076171875, 0.6088638305664062, 0.6264495849609375, 0.6440353393554688, 0.66162109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 13.0, 17.0, 30.0, 45.0, 53.0, 88.0, 177.0, 320.0, 736.0, 2177.0, 9480.0, 101504.0, 806593.0, 113455.0, 9968.0, 2280.0, 799.0, 365.0, 176.0, 77.0, 66.0, 38.0, 23.0, 16.0, 15.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.16762542724609375, -0.1610565185546875, -0.15448760986328125, -0.147918701171875, -0.14134979248046875, -0.1347808837890625, -0.12821197509765625, -0.12164306640625, -0.11507415771484375, -0.1085052490234375, -0.10193634033203125, -0.095367431640625, -0.08879852294921875, -0.0822296142578125, -0.07566070556640625, -0.069091796875, -0.06252288818359375, -0.0559539794921875, -0.04938507080078125, -0.042816162109375, -0.03624725341796875, -0.0296783447265625, -0.02310943603515625, -0.01654052734375, -0.00997161865234375, -0.0034027099609375, 0.00316619873046875, 0.009735107421875, 0.01630401611328125, 0.0228729248046875, 0.02944183349609375, 0.0360107421875, 0.04257965087890625, 0.0491485595703125, 0.05571746826171875, 0.062286376953125, 0.06885528564453125, 0.0754241943359375, 0.08199310302734375, 0.08856201171875, 0.09513092041015625, 0.1016998291015625, 0.10826873779296875, 0.114837646484375, 0.12140655517578125, 0.1279754638671875, 0.13454437255859375, 0.14111328125, 0.14768218994140625, 0.1542510986328125, 0.16082000732421875, 0.167388916015625, 0.17395782470703125, 0.1805267333984375, 0.18709564208984375, 0.19366455078125, 0.20023345947265625, 0.2068023681640625, 0.21337127685546875, 0.219940185546875, 0.22650909423828125, 0.2330780029296875, 0.23964691162109375, 0.2462158203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 10.0, 5.0, 10.0, 16.0, 28.0, 30.0, 65.0, 69.0, 106.0, 124.0, 142.0, 120.0, 92.0, 63.0, 48.0, 23.0, 13.0, 18.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001919269561767578, -0.0001851152628660202, -0.0001783035695552826, -0.00017149187624454498, -0.00016468018293380737, -0.00015786848962306976, -0.00015105679631233215, -0.00014424510300159454, -0.00013743340969085693, -0.00013062171638011932, -0.00012381002306938171, -0.0001169983297586441, -0.0001101866364479065, -0.00010337494313716888, -9.656324982643127e-05, -8.975155651569366e-05, -8.293986320495605e-05, -7.612816989421844e-05, -6.931647658348083e-05, -6.250478327274323e-05, -5.5693089962005615e-05, -4.8881396651268005e-05, -4.2069703340530396e-05, -3.5258010029792786e-05, -2.8446316719055176e-05, -2.1634623408317566e-05, -1.4822930097579956e-05, -8.011236786842346e-06, -1.1995434761047363e-06, 5.6121498346328735e-06, 1.2423843145370483e-05, 1.9235536456108093e-05, 2.6047229766845703e-05, 3.285892307758331e-05, 3.967061638832092e-05, 4.648230969905853e-05, 5.329400300979614e-05, 6.010569632053375e-05, 6.691738963127136e-05, 7.372908294200897e-05, 8.054077625274658e-05, 8.735246956348419e-05, 9.41641628742218e-05, 0.00010097585618495941, 0.00010778754949569702, 0.00011459924280643463, 0.00012141093611717224, 0.00012822262942790985, 0.00013503432273864746, 0.00014184601604938507, 0.00014865770936012268, 0.0001554694026708603, 0.0001622810959815979, 0.0001690927892923355, 0.00017590448260307312, 0.00018271617591381073, 0.00018952786922454834, 0.00019633956253528595, 0.00020315125584602356, 0.00020996294915676117, 0.00021677464246749878, 0.0002235863357782364, 0.000230398029088974, 0.0002372097223997116, 0.00024402141571044922]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 5.0, 9.0, 10.0, 15.0, 35.0, 58.0, 84.0, 188.0, 353.0, 757.0, 2014.0, 7452.0, 55792.0, 730115.0, 229255.0, 16755.0, 3489.0, 1143.0, 492.0, 222.0, 126.0, 49.0, 46.0, 23.0, 18.0, 8.0, 9.0, 5.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1810302734375, -0.1749420166015625, -0.168853759765625, -0.1627655029296875, -0.15667724609375, -0.1505889892578125, -0.144500732421875, -0.1384124755859375, -0.13232421875, -0.1262359619140625, -0.120147705078125, -0.1140594482421875, -0.10797119140625, -0.1018829345703125, -0.095794677734375, -0.0897064208984375, -0.0836181640625, -0.0775299072265625, -0.071441650390625, -0.0653533935546875, -0.05926513671875, -0.0531768798828125, -0.047088623046875, -0.0410003662109375, -0.034912109375, -0.0288238525390625, -0.022735595703125, -0.0166473388671875, -0.01055908203125, -0.0044708251953125, 0.001617431640625, 0.0077056884765625, 0.0137939453125, 0.0198822021484375, 0.025970458984375, 0.0320587158203125, 0.03814697265625, 0.0442352294921875, 0.050323486328125, 0.0564117431640625, 0.0625, 0.0685882568359375, 0.074676513671875, 0.0807647705078125, 0.08685302734375, 0.0929412841796875, 0.099029541015625, 0.1051177978515625, 0.1112060546875, 0.1172943115234375, 0.123382568359375, 0.1294708251953125, 0.13555908203125, 0.1416473388671875, 0.147735595703125, 0.1538238525390625, 0.159912109375, 0.1660003662109375, 0.172088623046875, 0.1781768798828125, 0.18426513671875, 0.1903533935546875, 0.196441650390625, 0.2025299072265625, 0.2086181640625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 10.0, 26.0, 34.0, 71.0, 105.0, 134.0, 183.0, 140.0, 116.0, 65.0, 33.0, 14.0, 15.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.1299571990966797, -0.12539291381835938, -0.12082862854003906, -0.11626434326171875, -0.11170005798339844, -0.10713577270507812, -0.10257148742675781, -0.0980072021484375, -0.09344291687011719, -0.08887863159179688, -0.08431434631347656, -0.07975006103515625, -0.07518577575683594, -0.07062149047851562, -0.06605720520019531, -0.061492919921875, -0.05692863464355469, -0.052364349365234375, -0.04780006408691406, -0.04323577880859375, -0.03867149353027344, -0.034107208251953125, -0.029542922973632812, -0.0249786376953125, -0.020414352416992188, -0.015850067138671875, -0.011285781860351562, -0.00672149658203125, -0.0021572113037109375, 0.002407073974609375, 0.0069713592529296875, 0.01153564453125, 0.016099929809570312, 0.020664215087890625, 0.025228500366210938, 0.02979278564453125, 0.03435707092285156, 0.038921356201171875, 0.04348564147949219, 0.0480499267578125, 0.05261421203613281, 0.057178497314453125, 0.06174278259277344, 0.06630706787109375, 0.07087135314941406, 0.07543563842773438, 0.07999992370605469, 0.084564208984375, 0.08912849426269531, 0.09369277954101562, 0.09825706481933594, 0.10282135009765625, 0.10738563537597656, 0.11194992065429688, 0.11651420593261719, 0.1210784912109375, 0.1256427764892578, 0.13020706176757812, 0.13477134704589844, 0.13933563232421875, 0.14389991760253906, 0.14846420288085938, 0.1530284881591797, 0.1575927734375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 14.0, 40.0, 80.0, 241.0, 301.0, 183.0, 75.0, 37.0, 8.0, 10.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3282575607299805, -3.192124605178833, -3.0559914112091064, -2.919858455657959, -2.7837252616882324, -2.647592306137085, -2.5114593505859375, -2.375326156616211, -2.2391929626464844, -2.103060007095337, -1.9669268131256104, -1.830793857574463, -1.6946606636047363, -1.5585277080535889, -1.4223946332931519, -1.2862615585327148, -1.1501286029815674, -1.0139955282211304, -0.8778624534606934, -0.7417294383049011, -0.6055963635444641, -0.4694632887840271, -0.33333027362823486, -0.19719719886779785, -0.06106412410736084, 0.07506893575191498, 0.2112019956111908, 0.3473350405693054, 0.48346811532974243, 0.6196011900901794, 0.7557342052459717, 0.8918672800064087, 1.0280003547668457, 1.1641334295272827, 1.3002665042877197, 1.4363994598388672, 1.5725326538085938, 1.7086656093597412, 1.8447986841201782, 1.9809317588806152, 2.117064952850342, 2.2531979084014893, 2.389331102371216, 2.5254640579223633, 2.66159725189209, 2.7977302074432373, 2.9338631629943848, 3.0699963569641113, 3.206129312515259, 3.3422622680664062, 3.478395462036133, 3.6145284175872803, 3.750661611557007, 3.8867945671081543, 4.022927761077881, 4.159060478210449, 4.295193672180176, 4.431326866149902, 4.567459583282471, 4.703592777252197, 4.839725971221924, 4.97585916519165, 5.111991882324219, 5.248125076293945, 5.384258270263672]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 12.0, 12.0, 9.0, 10.0, 22.0, 34.0, 20.0, 28.0, 35.0, 32.0, 39.0, 35.0, 37.0, 50.0, 58.0, 49.0, 52.0, 55.0, 39.0, 32.0, 43.0, 42.0, 31.0, 21.0, 27.0, 31.0, 28.0, 15.0, 8.0, 15.0, 14.0, 12.0, 11.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.8244390487670898, -1.764106273651123, -1.7037734985351562, -1.6434407234191895, -1.5831079483032227, -1.5227751731872559, -1.462442398071289, -1.4021096229553223, -1.3417768478393555, -1.2814440727233887, -1.2211112976074219, -1.160778522491455, -1.1004457473754883, -1.0401129722595215, -0.9797801375389099, -0.9194473624229431, -0.8591145277023315, -0.7987817525863647, -0.738448977470398, -0.6781162023544312, -0.6177834272384644, -0.5574506521224976, -0.497117817401886, -0.4367850422859192, -0.3764522671699524, -0.3161194920539856, -0.2557867169380188, -0.19545391201972961, -0.13512113690376282, -0.07478836178779602, -0.014455556869506836, 0.04587721824645996, 0.10620999336242676, 0.16654276847839355, 0.22687555849552155, 0.28720834851264954, 0.34754112362861633, 0.40787389874458313, 0.4682067036628723, 0.5285394787788391, 0.5888722538948059, 0.6492050290107727, 0.7095378041267395, 0.7698706388473511, 0.8302034139633179, 0.8905361890792847, 0.9508689641952515, 1.0112017393112183, 1.071534514427185, 1.1318672895431519, 1.1922000646591187, 1.2525328397750854, 1.3128656148910522, 1.373198390007019, 1.4335312843322754, 1.4938640594482422, 1.554196834564209, 1.6145296096801758, 1.6748623847961426, 1.7351951599121094, 1.7955279350280762, 1.855860710144043, 1.9161934852600098, 1.9765262603759766, 2.0368590354919434]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 9.0, 18.0, 55.0, 171.0, 474.0, 1645.0, 7558.0, 62672.0, 4013969.0, 94875.0, 9070.0, 1997.0, 735.0, 332.0, 205.0, 116.0, 81.0, 63.0, 50.0, 39.0, 24.0, 17.0, 20.0, 17.0, 14.0, 8.0, 4.0, 8.0, 5.0, 10.0, 8.0, 4.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4463157653808594, -0.40410614013671875, -0.3618965148925781, -0.3196868896484375, -0.2774772644042969, -0.23526763916015625, -0.19305801391601562, -0.150848388671875, -0.10863876342773438, -0.06642913818359375, -0.024219512939453125, 0.0179901123046875, 0.060199737548828125, 0.10240936279296875, 0.14461898803710938, 0.18682861328125, 0.22903823852539062, 0.27124786376953125, 0.3134574890136719, 0.3556671142578125, 0.3978767395019531, 0.44008636474609375, 0.4822959899902344, 0.524505615234375, 0.5667152404785156, 0.6089248657226562, 0.6511344909667969, 0.6933441162109375, 0.7355537414550781, 0.7777633666992188, 0.8199729919433594, 0.8621826171875, 0.9043922424316406, 0.9466018676757812, 0.9888114929199219, 1.0310211181640625, 1.0732307434082031, 1.1154403686523438, 1.1576499938964844, 1.199859619140625, 1.2420692443847656, 1.2842788696289062, 1.3264884948730469, 1.3686981201171875, 1.4109077453613281, 1.4531173706054688, 1.4953269958496094, 1.53753662109375, 1.5797462463378906, 1.6219558715820312, 1.6641654968261719, 1.7063751220703125, 1.7485847473144531, 1.7907943725585938, 1.8330039978027344, 1.875213623046875, 1.9174232482910156, 1.9596328735351562, 2.001842498779297, 2.0440521240234375, 2.086261749267578, 2.1284713745117188, 2.1706809997558594, 2.212890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 12.0, 21.0, 42.0, 50.0, 88.0, 137.0, 142.0, 137.0, 128.0, 108.0, 58.0, 52.0, 18.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07281494140625, -0.06629085540771484, -0.05976676940917969, -0.05324268341064453, -0.046718597412109375, -0.04019451141357422, -0.03367042541503906, -0.027146339416503906, -0.02062225341796875, -0.014098167419433594, -0.0075740814208984375, -0.0010499954223632812, 0.005474090576171875, 0.011998176574707031, 0.018522262573242188, 0.025046348571777344, 0.0315704345703125, 0.038094520568847656, 0.04461860656738281, 0.05114269256591797, 0.057666778564453125, 0.06419086456298828, 0.07071495056152344, 0.0772390365600586, 0.08376312255859375, 0.0902872085571289, 0.09681129455566406, 0.10333538055419922, 0.10985946655273438, 0.11638355255126953, 0.12290763854980469, 0.12943172454833984, 0.135955810546875, 0.14247989654541016, 0.1490039825439453, 0.15552806854248047, 0.16205215454101562, 0.16857624053955078, 0.17510032653808594, 0.1816244125366211, 0.18814849853515625, 0.1946725845336914, 0.20119667053222656, 0.20772075653076172, 0.21424484252929688, 0.22076892852783203, 0.2272930145263672, 0.23381710052490234, 0.2403411865234375, 0.24686527252197266, 0.2533893585205078, 0.25991344451904297, 0.2664375305175781, 0.2729616165161133, 0.27948570251464844, 0.2860097885131836, 0.29253387451171875, 0.2990579605102539, 0.30558204650878906, 0.3121061325073242, 0.3186302185058594, 0.32515430450439453, 0.3316783905029297, 0.33820247650146484, 0.3447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 10.0, 20.0, 40.0, 46.0, 109.0, 244.0, 931.0, 6807.0, 4112493.0, 68397.0, 3773.0, 823.0, 263.0, 116.0, 57.0, 42.0, 37.0, 28.0, 16.0, 11.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.30712890625, -2.1962890625, -2.08544921875, -1.974609375, -1.86376953125, -1.7529296875, -1.64208984375, -1.53125, -1.42041015625, -1.3095703125, -1.19873046875, -1.087890625, -0.97705078125, -0.8662109375, -0.75537109375, -0.64453125, -0.53369140625, -0.4228515625, -0.31201171875, -0.201171875, -0.09033203125, 0.0205078125, 0.13134765625, 0.2421875, 0.35302734375, 0.4638671875, 0.57470703125, 0.685546875, 0.79638671875, 0.9072265625, 1.01806640625, 1.12890625, 1.23974609375, 1.3505859375, 1.46142578125, 1.572265625, 1.68310546875, 1.7939453125, 1.90478515625, 2.015625, 2.12646484375, 2.2373046875, 2.34814453125, 2.458984375, 2.56982421875, 2.6806640625, 2.79150390625, 2.90234375, 3.01318359375, 3.1240234375, 3.23486328125, 3.345703125, 3.45654296875, 3.5673828125, 3.67822265625, 3.7890625, 3.89990234375, 4.0107421875, 4.12158203125, 4.232421875, 4.34326171875, 4.4541015625, 4.56494140625, 4.67578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 12.0, 25.0, 73.0, 2441.0, 1340.0, 102.0, 25.0, 16.0, 5.0, 5.0, 5.0, 2.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302978515625, -0.2753257751464844, -0.24767303466796875, -0.22002029418945312, -0.1923675537109375, -0.16471481323242188, -0.13706207275390625, -0.10940933227539062, -0.081756591796875, -0.054103851318359375, -0.02645111083984375, 0.001201629638671875, 0.0288543701171875, 0.056507110595703125, 0.08415985107421875, 0.11181259155273438, 0.13946533203125, 0.16711807250976562, 0.19477081298828125, 0.22242355346679688, 0.2500762939453125, 0.2777290344238281, 0.30538177490234375, 0.3330345153808594, 0.360687255859375, 0.3883399963378906, 0.41599273681640625, 0.4436454772949219, 0.4712982177734375, 0.4989509582519531, 0.5266036987304688, 0.5542564392089844, 0.5819091796875, 0.6095619201660156, 0.6372146606445312, 0.6648674011230469, 0.6925201416015625, 0.7201728820800781, 0.7478256225585938, 0.7754783630371094, 0.803131103515625, 0.8307838439941406, 0.8584365844726562, 0.8860893249511719, 0.9137420654296875, 0.9413948059082031, 0.9690475463867188, 0.9967002868652344, 1.02435302734375, 1.0520057678222656, 1.0796585083007812, 1.1073112487792969, 1.1349639892578125, 1.1626167297363281, 1.1902694702148438, 1.2179222106933594, 1.245574951171875, 1.2732276916503906, 1.3008804321289062, 1.3285331726074219, 1.3561859130859375, 1.3838386535644531, 1.4114913940429688, 1.4391441345214844, 1.466796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 15.0, 74.0, 447.0, 370.0, 62.0, 21.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.511024236679077, -2.3305482864379883, -2.1500725746154785, -1.9695967435836792, -1.7891209125518799, -1.6086450815200806, -1.4281692504882812, -1.247693419456482, -1.0672175884246826, -0.8867417573928833, -0.706265926361084, -0.5257900953292847, -0.34531426429748535, -0.16483843326568604, 0.01563739776611328, 0.1961132287979126, 0.3765890598297119, 0.5570648908615112, 0.7375407218933105, 0.9180165529251099, 1.0984923839569092, 1.2789682149887085, 1.4594440460205078, 1.6399198770523071, 1.8203957080841064, 2.0008716583251953, 2.181347370147705, 2.361823081970215, 2.5422990322113037, 2.7227749824523926, 2.9032506942749023, 3.083726406097412, 3.264202117919922, 3.4446778297424316, 3.6251537799835205, 3.8056297302246094, 3.986105442047119, 4.166581153869629, 4.347057342529297, 4.527533054351807, 4.708008766174316, 4.888484477996826, 5.068960189819336, 5.249436378479004, 5.429912090301514, 5.610387802124023, 5.790863990783691, 5.971339702606201, 6.151815414428711, 6.332291126251221, 6.5127668380737305, 6.693243026733398, 6.873718738555908, 7.054194450378418, 7.234670639038086, 7.415146350860596, 7.5956220626831055, 7.776097774505615, 7.956573486328125, 8.137049674987793, 8.317525863647461, 8.498001098632812, 8.67847728729248, 8.858952522277832, 9.0394287109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 12.0, 36.0, 61.0, 98.0, 131.0, 148.0, 174.0, 139.0, 77.0, 66.0, 36.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7043089866638184, -3.5832324028015137, -3.462155818939209, -3.3410792350769043, -3.2200026512145996, -3.098926067352295, -2.9778494834899902, -2.8567731380462646, -2.73569655418396, -2.6146199703216553, -2.4935433864593506, -2.372466802597046, -2.251390218734741, -2.1303138732910156, -2.009237289428711, -1.8881607055664062, -1.767084002494812, -1.6460074186325073, -1.5249308347702026, -1.4038543701171875, -1.2827777862548828, -1.1617012023925781, -1.0406246185302734, -0.9195480942726135, -0.7984715104103088, -0.6773949265480042, -0.5563184022903442, -0.43524181842803955, -0.31416526436805725, -0.19308871030807495, -0.07201212644577026, 0.04906439781188965, 0.17014098167419434, 0.29121753573417664, 0.41229408979415894, 0.5333706736564636, 0.6544471979141235, 0.7755237817764282, 0.8966003656387329, 1.017676830291748, 1.1387534141540527, 1.2598299980163574, 1.380906581878662, 1.5019831657409668, 1.623059630393982, 1.7441362142562866, 1.8652127981185913, 1.9862892627716064, 2.1073660850524902, 2.228442668914795, 2.3495192527770996, 2.4705958366394043, 2.591672420501709, 2.7127490043640137, 2.8338255882263184, 2.954901933670044, 3.0759785175323486, 3.1970551013946533, 3.318131685256958, 3.4392082691192627, 3.5602848529815674, 3.681361198425293, 3.8024377822875977, 3.9235143661499023, 4.044590950012207]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 12.0, 14.0, 20.0, 26.0, 32.0, 54.0, 86.0, 95.0, 193.0, 356.0, 633.0, 1755.0, 9214.0, 147327.0, 832089.0, 49430.0, 4734.0, 1175.0, 511.0, 282.0, 158.0, 101.0, 66.0, 50.0, 42.0, 24.0, 14.0, 17.0, 12.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1572265625, -1.1262283325195312, -1.0952301025390625, -1.0642318725585938, -1.033233642578125, -1.0022354125976562, -0.9712371826171875, -0.9402389526367188, -0.90924072265625, -0.8782424926757812, -0.8472442626953125, -0.8162460327148438, -0.785247802734375, -0.7542495727539062, -0.7232513427734375, -0.6922531127929688, -0.6612548828125, -0.6302566528320312, -0.5992584228515625, -0.5682601928710938, -0.537261962890625, -0.5062637329101562, -0.4752655029296875, -0.44426727294921875, -0.41326904296875, -0.38227081298828125, -0.3512725830078125, -0.32027435302734375, -0.289276123046875, -0.25827789306640625, -0.2272796630859375, -0.19628143310546875, -0.165283203125, -0.13428497314453125, -0.1032867431640625, -0.07228851318359375, -0.041290283203125, -0.01029205322265625, 0.0207061767578125, 0.05170440673828125, 0.08270263671875, 0.11370086669921875, 0.1446990966796875, 0.17569732666015625, 0.206695556640625, 0.23769378662109375, 0.2686920166015625, 0.29969024658203125, 0.3306884765625, 0.36168670654296875, 0.3926849365234375, 0.42368316650390625, 0.454681396484375, 0.48567962646484375, 0.5166778564453125, 0.5476760864257812, 0.57867431640625, 0.6096725463867188, 0.6406707763671875, 0.6716690063476562, 0.702667236328125, 0.7336654663085938, 0.7646636962890625, 0.7956619262695312, 0.82666015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 16.0, 39.0, 72.0, 137.0, 164.0, 153.0, 158.0, 117.0, 76.0, 45.0, 17.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2000732421875, -0.19156455993652344, -0.18305587768554688, -0.1745471954345703, -0.16603851318359375, -0.1575298309326172, -0.14902114868164062, -0.14051246643066406, -0.1320037841796875, -0.12349510192871094, -0.11498641967773438, -0.10647773742675781, -0.09796905517578125, -0.08946037292480469, -0.08095169067382812, -0.07244300842285156, -0.063934326171875, -0.05542564392089844, -0.046916961669921875, -0.03840827941894531, -0.02989959716796875, -0.021390914916992188, -0.012882232666015625, -0.0043735504150390625, 0.0041351318359375, 0.012643814086914062, 0.021152496337890625, 0.029661178588867188, 0.03816986083984375, 0.04667854309082031, 0.055187225341796875, 0.06369590759277344, 0.07220458984375, 0.08071327209472656, 0.08922195434570312, 0.09773063659667969, 0.10623931884765625, 0.11474800109863281, 0.12325668334960938, 0.13176536560058594, 0.1402740478515625, 0.14878273010253906, 0.15729141235351562, 0.1658000946044922, 0.17430877685546875, 0.1828174591064453, 0.19132614135742188, 0.19983482360839844, 0.208343505859375, 0.21685218811035156, 0.22536087036132812, 0.2338695526123047, 0.24237823486328125, 0.2508869171142578, 0.2593955993652344, 0.26790428161621094, 0.2764129638671875, 0.28492164611816406, 0.2934303283691406, 0.3019390106201172, 0.31044769287109375, 0.3189563751220703, 0.3274650573730469, 0.33597373962402344, 0.344482421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 14.0, 12.0, 20.0, 29.0, 40.0, 77.0, 129.0, 256.0, 553.0, 1413.0, 4775.0, 20745.0, 151283.0, 701305.0, 140833.0, 19910.0, 4667.0, 1397.0, 510.0, 223.0, 134.0, 64.0, 44.0, 36.0, 19.0, 18.0, 9.0, 9.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.369354248046875, -0.35540771484375, -0.341461181640625, -0.3275146484375, -0.313568115234375, -0.29962158203125, -0.285675048828125, -0.271728515625, -0.257781982421875, -0.24383544921875, -0.229888916015625, -0.2159423828125, -0.201995849609375, -0.18804931640625, -0.174102783203125, -0.16015625, -0.146209716796875, -0.13226318359375, -0.118316650390625, -0.1043701171875, -0.090423583984375, -0.07647705078125, -0.062530517578125, -0.048583984375, -0.034637451171875, -0.02069091796875, -0.006744384765625, 0.0072021484375, 0.021148681640625, 0.03509521484375, 0.049041748046875, 0.06298828125, 0.076934814453125, 0.09088134765625, 0.104827880859375, 0.1187744140625, 0.132720947265625, 0.14666748046875, 0.160614013671875, 0.174560546875, 0.188507080078125, 0.20245361328125, 0.216400146484375, 0.2303466796875, 0.244293212890625, 0.25823974609375, 0.272186279296875, 0.2861328125, 0.300079345703125, 0.31402587890625, 0.327972412109375, 0.3419189453125, 0.355865478515625, 0.36981201171875, 0.383758544921875, 0.397705078125, 0.411651611328125, 0.42559814453125, 0.439544677734375, 0.4534912109375, 0.467437744140625, 0.48138427734375, 0.495330810546875, 0.50927734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 2.0, 2.0, 5.0, 7.0, 10.0, 6.0, 9.0, 15.0, 9.0, 21.0, 24.0, 31.0, 29.0, 41.0, 35.0, 51.0, 47.0, 41.0, 51.0, 50.0, 48.0, 59.0, 64.0, 55.0, 52.0, 46.0, 32.0, 39.0, 14.0, 28.0, 16.0, 11.0, 14.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27880859375, -0.2684898376464844, -0.25817108154296875, -0.24785232543945312, -0.2375335693359375, -0.22721481323242188, -0.21689605712890625, -0.20657730102539062, -0.196258544921875, -0.18593978881835938, -0.17562103271484375, -0.16530227661132812, -0.1549835205078125, -0.14466476440429688, -0.13434600830078125, -0.12402725219726562, -0.11370849609375, -0.10338973999023438, -0.09307098388671875, -0.08275222778320312, -0.0724334716796875, -0.062114715576171875, -0.05179595947265625, -0.041477203369140625, -0.031158447265625, -0.020839691162109375, -0.01052093505859375, -0.000202178955078125, 0.0101165771484375, 0.020435333251953125, 0.03075408935546875, 0.041072845458984375, 0.0513916015625, 0.061710357666015625, 0.07202911376953125, 0.08234786987304688, 0.0926666259765625, 0.10298538208007812, 0.11330413818359375, 0.12362289428710938, 0.133941650390625, 0.14426040649414062, 0.15457916259765625, 0.16489791870117188, 0.1752166748046875, 0.18553543090820312, 0.19585418701171875, 0.20617294311523438, 0.21649169921875, 0.22681045532226562, 0.23712921142578125, 0.24744796752929688, 0.2577667236328125, 0.2680854797363281, 0.27840423583984375, 0.2887229919433594, 0.299041748046875, 0.3093605041503906, 0.31967926025390625, 0.3299980163574219, 0.3403167724609375, 0.3506355285644531, 0.36095428466796875, 0.3712730407714844, 0.381591796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 10.0, 16.0, 36.0, 63.0, 99.0, 194.0, 334.0, 739.0, 1841.0, 5987.0, 31854.0, 274944.0, 600614.0, 111402.0, 14493.0, 3461.0, 1262.0, 562.0, 279.0, 139.0, 81.0, 39.0, 30.0, 17.0, 10.0, 8.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15625, -0.15169334411621094, -0.14713668823242188, -0.1425800323486328, -0.13802337646484375, -0.1334667205810547, -0.12891006469726562, -0.12435340881347656, -0.1197967529296875, -0.11524009704589844, -0.11068344116210938, -0.10612678527832031, -0.10157012939453125, -0.09701347351074219, -0.09245681762695312, -0.08790016174316406, -0.083343505859375, -0.07878684997558594, -0.07423019409179688, -0.06967353820800781, -0.06511688232421875, -0.06056022644042969, -0.056003570556640625, -0.05144691467285156, -0.0468902587890625, -0.04233360290527344, -0.037776947021484375, -0.03322029113769531, -0.02866363525390625, -0.024106979370117188, -0.019550323486328125, -0.014993667602539062, -0.01043701171875, -0.0058803558349609375, -0.001323699951171875, 0.0032329559326171875, 0.00778961181640625, 0.012346267700195312, 0.016902923583984375, 0.021459579467773438, 0.0260162353515625, 0.030572891235351562, 0.035129547119140625, 0.03968620300292969, 0.04424285888671875, 0.04879951477050781, 0.053356170654296875, 0.05791282653808594, 0.062469482421875, 0.06702613830566406, 0.07158279418945312, 0.07613945007324219, 0.08069610595703125, 0.08525276184082031, 0.08980941772460938, 0.09436607360839844, 0.0989227294921875, 0.10347938537597656, 0.10803604125976562, 0.11259269714355469, 0.11714935302734375, 0.12170600891113281, 0.12626266479492188, 0.13081932067871094, 0.1353759765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 11.0, 13.0, 23.0, 38.0, 74.0, 139.0, 196.0, 173.0, 135.0, 90.0, 43.0, 32.0, 17.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019407272338867188, -0.00018336623907089233, -0.0001726597547531128, -0.00016195327043533325, -0.0001512467861175537, -0.00014054030179977417, -0.00012983381748199463, -0.00011912733316421509, -0.00010842084884643555, -9.7714364528656e-05, -8.700788021087646e-05, -7.630139589309692e-05, -6.559491157531738e-05, -5.488842725753784e-05, -4.41819429397583e-05, -3.347545862197876e-05, -2.276897430419922e-05, -1.2062489986419678e-05, -1.3560056686401367e-06, 9.350478649139404e-06, 2.0056962966918945e-05, 3.0763447284698486e-05, 4.146993160247803e-05, 5.217641592025757e-05, 6.288290023803711e-05, 7.358938455581665e-05, 8.429586887359619e-05, 9.500235319137573e-05, 0.00010570883750915527, 0.00011641532182693481, 0.00012712180614471436, 0.0001378282904624939, 0.00014853477478027344, 0.00015924125909805298, 0.00016994774341583252, 0.00018065422773361206, 0.0001913607120513916, 0.00020206719636917114, 0.00021277368068695068, 0.00022348016500473022, 0.00023418664932250977, 0.0002448931336402893, 0.00025559961795806885, 0.0002663061022758484, 0.00027701258659362793, 0.00028771907091140747, 0.000298425555229187, 0.00030913203954696655, 0.0003198385238647461, 0.00033054500818252563, 0.0003412514925003052, 0.0003519579768180847, 0.00036266446113586426, 0.0003733709454536438, 0.00038407742977142334, 0.0003947839140892029, 0.0004054903984069824, 0.00041619688272476196, 0.0004269033670425415, 0.00043760985136032104, 0.0004483163356781006, 0.0004590228199958801, 0.00046972930431365967, 0.0004804357886314392, 0.0004911422729492188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 6.0, 4.0, 11.0, 23.0, 26.0, 51.0, 87.0, 171.0, 351.0, 722.0, 2108.0, 7758.0, 44707.0, 397484.0, 515370.0, 65506.0, 9868.0, 2593.0, 859.0, 404.0, 188.0, 103.0, 45.0, 28.0, 16.0, 14.0, 10.0, 9.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14750289916992188, -0.14290618896484375, -0.13830947875976562, -0.1337127685546875, -0.12911605834960938, -0.12451934814453125, -0.11992263793945312, -0.115325927734375, -0.11072921752929688, -0.10613250732421875, -0.10153579711914062, -0.0969390869140625, -0.09234237670898438, -0.08774566650390625, -0.08314895629882812, -0.07855224609375, -0.07395553588867188, -0.06935882568359375, -0.06476211547851562, -0.0601654052734375, -0.055568695068359375, -0.05097198486328125, -0.046375274658203125, -0.041778564453125, -0.037181854248046875, -0.03258514404296875, -0.027988433837890625, -0.0233917236328125, -0.018795013427734375, -0.01419830322265625, -0.009601593017578125, -0.0050048828125, -0.000408172607421875, 0.00418853759765625, 0.008785247802734375, 0.0133819580078125, 0.017978668212890625, 0.02257537841796875, 0.027172088623046875, 0.031768798828125, 0.036365509033203125, 0.04096221923828125, 0.045558929443359375, 0.0501556396484375, 0.054752349853515625, 0.05934906005859375, 0.06394577026367188, 0.06854248046875, 0.07313919067382812, 0.07773590087890625, 0.08233261108398438, 0.0869293212890625, 0.09152603149414062, 0.09612274169921875, 0.10071945190429688, 0.105316162109375, 0.10991287231445312, 0.11450958251953125, 0.11910629272460938, 0.1237030029296875, 0.12829971313476562, 0.13289642333984375, 0.13749313354492188, 0.14208984375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 10.0, 14.0, 26.0, 29.0, 41.0, 71.0, 97.0, 117.0, 113.0, 121.0, 104.0, 71.0, 48.0, 37.0, 39.0, 20.0, 7.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09651374816894531, -0.09244155883789062, -0.08836936950683594, -0.08429718017578125, -0.08022499084472656, -0.07615280151367188, -0.07208061218261719, -0.0680084228515625, -0.06393623352050781, -0.059864044189453125, -0.05579185485839844, -0.05171966552734375, -0.04764747619628906, -0.043575286865234375, -0.03950309753417969, -0.035430908203125, -0.03135871887207031, -0.027286529541015625, -0.023214340209960938, -0.01914215087890625, -0.015069961547851562, -0.010997772216796875, -0.0069255828857421875, -0.0028533935546875, 0.0012187957763671875, 0.005290985107421875, 0.009363174438476562, 0.01343536376953125, 0.017507553100585938, 0.021579742431640625, 0.025651931762695312, 0.02972412109375, 0.03379631042480469, 0.037868499755859375, 0.04194068908691406, 0.04601287841796875, 0.05008506774902344, 0.054157257080078125, 0.05822944641113281, 0.0623016357421875, 0.06637382507324219, 0.07044601440429688, 0.07451820373535156, 0.07859039306640625, 0.08266258239746094, 0.08673477172851562, 0.09080696105957031, 0.094879150390625, 0.09895133972167969, 0.10302352905273438, 0.10709571838378906, 0.11116790771484375, 0.11524009704589844, 0.11931228637695312, 0.12338447570800781, 0.1274566650390625, 0.1315288543701172, 0.13560104370117188, 0.13967323303222656, 0.14374542236328125, 0.14781761169433594, 0.15188980102539062, 0.1559619903564453, 0.1600341796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 13.0, 15.0, 25.0, 48.0, 87.0, 184.0, 222.0, 194.0, 98.0, 52.0, 23.0, 15.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.639617919921875, -2.558884859085083, -2.478151798248291, -2.397418737411499, -2.316685676574707, -2.235952615737915, -2.155219554901123, -2.074486255645752, -1.9937533140182495, -1.9130202531814575, -1.8322871923446655, -1.7515541315078735, -1.670820951461792, -1.590087890625, -1.509354829788208, -1.428621768951416, -1.347888708114624, -1.267155647277832, -1.18642258644104, -1.105689525604248, -1.024956464767456, -0.9442233443260193, -0.8634902238845825, -0.7827571630477905, -0.7020241022109985, -0.6212910413742065, -0.5405579805374146, -0.4598248600959778, -0.3790917992591858, -0.2983587384223938, -0.21762564778327942, -0.13689255714416504, -0.056159257888793945, 0.02457381784915924, 0.10530689358711243, 0.1860399693250656, 0.2667730450630188, 0.3475061058998108, 0.42823919653892517, 0.5089722871780396, 0.5897053480148315, 0.6704384088516235, 0.7511714696884155, 0.8319045901298523, 0.9126376509666443, 0.9933707118034363, 1.074103832244873, 1.154836893081665, 1.235569953918457, 1.316303014755249, 1.397036075592041, 1.477769136428833, 1.558502197265625, 1.639235258102417, 1.7199684381484985, 1.8007014989852905, 1.8814345598220825, 1.9621676206588745, 2.042900800704956, 2.123633861541748, 2.20436692237854, 2.285099983215332, 2.365833044052124, 2.446566104888916, 2.527299165725708]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 10.0, 8.0, 9.0, 20.0, 22.0, 19.0, 28.0, 38.0, 41.0, 39.0, 54.0, 48.0, 61.0, 72.0, 65.0, 75.0, 55.0, 55.0, 56.0, 48.0, 37.0, 30.0, 22.0, 18.0, 15.0, 21.0, 15.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.3562161922454834, -2.291783332824707, -2.2273507118225098, -2.1629178524017334, -2.098484992980957, -2.0340521335601807, -1.9696193933486938, -1.905186653137207, -1.8407537937164307, -1.7763209342956543, -1.7118881940841675, -1.6474554538726807, -1.5830225944519043, -1.518589735031128, -1.4541569948196411, -1.3897242546081543, -1.325291395187378, -1.2608585357666016, -1.1964257955551147, -1.131993055343628, -1.0675601959228516, -1.0031273365020752, -0.9386945962905884, -0.8742617964744568, -0.8098289966583252, -0.7453961968421936, -0.680963397026062, -0.6165305972099304, -0.5520977973937988, -0.48766499757766724, -0.42323219776153564, -0.35879939794540405, -0.29436659812927246, -0.22993379831314087, -0.16550099849700928, -0.10106819868087769, -0.036635398864746094, 0.027797400951385498, 0.09223020076751709, 0.15666300058364868, 0.22109580039978027, 0.28552860021591187, 0.34996140003204346, 0.41439419984817505, 0.47882699966430664, 0.5432597994804382, 0.6076925992965698, 0.6721253991127014, 0.736558198928833, 0.8009909987449646, 0.8654237985610962, 0.9298565983772278, 0.9942893981933594, 1.0587222576141357, 1.1231549978256226, 1.1875877380371094, 1.2520205974578857, 1.316453456878662, 1.380886197090149, 1.4453189373016357, 1.509751796722412, 1.5741846561431885, 1.6386173963546753, 1.703050136566162, 1.7674829959869385]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 12.0, 24.0, 43.0, 122.0, 297.0, 786.0, 4169.0, 197155.0, 3980725.0, 8616.0, 1326.0, 487.0, 227.0, 116.0, 61.0, 30.0, 23.0, 18.0, 18.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9121170043945312, -0.8618316650390625, -0.8115463256835938, -0.761260986328125, -0.7109756469726562, -0.6606903076171875, -0.6104049682617188, -0.56011962890625, -0.5098342895507812, -0.4595489501953125, -0.40926361083984375, -0.358978271484375, -0.30869293212890625, -0.2584075927734375, -0.20812225341796875, -0.1578369140625, -0.10755157470703125, -0.0572662353515625, -0.00698089599609375, 0.043304443359375, 0.09358978271484375, 0.1438751220703125, 0.19416046142578125, 0.24444580078125, 0.29473114013671875, 0.3450164794921875, 0.39530181884765625, 0.445587158203125, 0.49587249755859375, 0.5461578369140625, 0.5964431762695312, 0.646728515625, 0.6970138549804688, 0.7472991943359375, 0.7975845336914062, 0.847869873046875, 0.8981552124023438, 0.9484405517578125, 0.9987258911132812, 1.04901123046875, 1.0992965698242188, 1.1495819091796875, 1.1998672485351562, 1.250152587890625, 1.3004379272460938, 1.3507232666015625, 1.4010086059570312, 1.4512939453125, 1.5015792846679688, 1.5518646240234375, 1.6021499633789062, 1.652435302734375, 1.7027206420898438, 1.7530059814453125, 1.8032913208007812, 1.85357666015625, 1.9038619995117188, 1.9541473388671875, 2.0044326782226562, 2.054718017578125, 2.1050033569335938, 2.1552886962890625, 2.2055740356445312, 2.255859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 17.0, 32.0, 67.0, 105.0, 144.0, 144.0, 140.0, 138.0, 102.0, 62.0, 31.0, 18.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180419921875, -0.1722259521484375, -0.164031982421875, -0.1558380126953125, -0.14764404296875, -0.1394500732421875, -0.131256103515625, -0.1230621337890625, -0.1148681640625, -0.1066741943359375, -0.098480224609375, -0.0902862548828125, -0.08209228515625, -0.0738983154296875, -0.065704345703125, -0.0575103759765625, -0.04931640625, -0.0411224365234375, -0.032928466796875, -0.0247344970703125, -0.01654052734375, -0.0083465576171875, -0.000152587890625, 0.0080413818359375, 0.0162353515625, 0.0244293212890625, 0.032623291015625, 0.0408172607421875, 0.04901123046875, 0.0572052001953125, 0.065399169921875, 0.0735931396484375, 0.081787109375, 0.0899810791015625, 0.098175048828125, 0.1063690185546875, 0.11456298828125, 0.1227569580078125, 0.130950927734375, 0.1391448974609375, 0.1473388671875, 0.1555328369140625, 0.163726806640625, 0.1719207763671875, 0.18011474609375, 0.1883087158203125, 0.196502685546875, 0.2046966552734375, 0.212890625, 0.2210845947265625, 0.229278564453125, 0.2374725341796875, 0.24566650390625, 0.2538604736328125, 0.262054443359375, 0.2702484130859375, 0.2784423828125, 0.2866363525390625, 0.294830322265625, 0.3030242919921875, 0.31121826171875, 0.3194122314453125, 0.327606201171875, 0.3358001708984375, 0.343994140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 8.0, 11.0, 18.0, 30.0, 29.0, 37.0, 45.0, 54.0, 79.0, 130.0, 438.0, 8088.0, 4179044.0, 5613.0, 301.0, 124.0, 72.0, 44.0, 34.0, 20.0, 24.0, 16.0, 7.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.516265869140625, -2.43878173828125, -2.361297607421875, -2.2838134765625, -2.206329345703125, -2.12884521484375, -2.051361083984375, -1.973876953125, -1.896392822265625, -1.81890869140625, -1.741424560546875, -1.6639404296875, -1.586456298828125, -1.50897216796875, -1.431488037109375, -1.35400390625, -1.276519775390625, -1.19903564453125, -1.121551513671875, -1.0440673828125, -0.966583251953125, -0.88909912109375, -0.811614990234375, -0.734130859375, -0.656646728515625, -0.57916259765625, -0.501678466796875, -0.4241943359375, -0.346710205078125, -0.26922607421875, -0.191741943359375, -0.1142578125, -0.036773681640625, 0.04071044921875, 0.118194580078125, 0.1956787109375, 0.273162841796875, 0.35064697265625, 0.428131103515625, 0.505615234375, 0.583099365234375, 0.66058349609375, 0.738067626953125, 0.8155517578125, 0.893035888671875, 0.97052001953125, 1.048004150390625, 1.12548828125, 1.202972412109375, 1.28045654296875, 1.357940673828125, 1.4354248046875, 1.512908935546875, 1.59039306640625, 1.667877197265625, 1.745361328125, 1.822845458984375, 1.90032958984375, 1.977813720703125, 2.0552978515625, 2.132781982421875, 2.21026611328125, 2.287750244140625, 2.365234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 10.0, 32.0, 159.0, 3399.0, 407.0, 46.0, 14.0, 4.0, 4.0], "bins": [-1.076171875, -1.0578393936157227, -1.0395069122314453, -1.021174430847168, -1.0028419494628906, -0.9845094680786133, -0.9661769866943359, -0.9478445053100586, -0.9295120239257812, -0.9111795425415039, -0.8928470611572266, -0.8745145797729492, -0.8561820983886719, -0.8378496170043945, -0.8195171356201172, -0.8011846542358398, -0.7828521728515625, -0.7645196914672852, -0.7461872100830078, -0.7278547286987305, -0.7095222473144531, -0.6911897659301758, -0.6728572845458984, -0.6545248031616211, -0.6361923217773438, -0.6178598403930664, -0.5995273590087891, -0.5811948776245117, -0.5628623962402344, -0.544529914855957, -0.5261974334716797, -0.5078649520874023, -0.489532470703125, -0.47119998931884766, -0.4528675079345703, -0.43453502655029297, -0.4162025451660156, -0.3978700637817383, -0.37953758239746094, -0.3612051010131836, -0.34287261962890625, -0.3245401382446289, -0.30620765686035156, -0.2878751754760742, -0.2695426940917969, -0.25121021270751953, -0.2328777313232422, -0.21454524993896484, -0.1962127685546875, -0.17788028717041016, -0.1595478057861328, -0.14121532440185547, -0.12288284301757812, -0.10455036163330078, -0.08621788024902344, -0.0678853988647461, -0.04955291748046875, -0.031220436096191406, -0.012887954711914062, 0.005444526672363281, 0.023777008056640625, 0.04210948944091797, 0.06044197082519531, 0.07877445220947266, 0.09710693359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 30.0, 823.0, 146.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.311243057250977, -12.036275863647461, -11.761307716369629, -11.486340522766113, -11.211372375488281, -10.936405181884766, -10.66143798828125, -10.386469841003418, -10.111502647399902, -9.836535453796387, -9.561567306518555, -9.286600112915039, -9.011631965637207, -8.736664772033691, -8.46169662475586, -8.186729431152344, -7.91176176071167, -7.636794090270996, -7.361826419830322, -7.086858749389648, -6.811891555786133, -6.536923885345459, -6.261956214904785, -5.986988544464111, -5.7120208740234375, -5.437053203582764, -5.16208553314209, -4.887118339538574, -4.6121506690979, -4.337182998657227, -4.062215328216553, -3.787247657775879, -3.512279987335205, -3.2373123168945312, -2.9623448848724365, -2.6873772144317627, -2.412409782409668, -2.137442111968994, -1.8624744415283203, -1.587506890296936, -1.3125393390655518, -1.0375717878341675, -0.7626041769981384, -0.4876365661621094, -0.2126690149307251, 0.06229853630065918, 0.337266206741333, 0.6122337579727173, 0.8872013092041016, 1.1621688604354858, 1.4371364116668701, 1.712104082107544, 1.9870716333389282, 2.2620391845703125, 2.5370068550109863, 2.81197452545166, 3.086941957473755, 3.3619096279144287, 3.6368770599365234, 3.9118447303771973, 4.186812400817871, 4.461779594421387, 4.736747741699219, 5.011714935302734, 5.286682605743408]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 9.0, 43.0, 83.0, 171.0, 241.0, 229.0, 139.0, 58.0, 22.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.085524082183838, -2.99118709564209, -2.8968498706817627, -2.8025128841400146, -2.7081756591796875, -2.6138386726379395, -2.5195016860961914, -2.4251644611358643, -2.330827236175537, -2.236490249633789, -2.142153024673462, -2.047816038131714, -1.9534788131713867, -1.8591418266296387, -1.764804720878601, -1.6704676151275635, -1.5761306285858154, -1.4817935228347778, -1.3874564170837402, -1.2931194305419922, -1.198782205581665, -1.104445219039917, -1.0101081132888794, -0.9157710075378418, -0.8214339017868042, -0.7270967960357666, -0.632759690284729, -0.5384226441383362, -0.4440855383872986, -0.349748432636261, -0.25541138648986816, -0.16107428073883057, -0.06673693656921387, 0.027600154280662537, 0.12193724513053894, 0.21627432107925415, 0.31061142683029175, 0.40494853258132935, 0.49928557872772217, 0.5936226844787598, 0.6879597902297974, 0.782296895980835, 0.8766340017318726, 0.9709710478782654, 1.0653080940246582, 1.1596453189849854, 1.2539823055267334, 1.348319411277771, 1.4426565170288086, 1.5369936227798462, 1.6313307285308838, 1.7256677150726318, 1.820004940032959, 1.914341926574707, 2.008678913116455, 2.1030161380767822, 2.1973533630371094, 2.2916903495788574, 2.3860275745391846, 2.4803645610809326, 2.5747017860412598, 2.669038772583008, 2.763375759124756, 2.857712984085083, 2.952049970626831]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 7.0, 5.0, 9.0, 13.0, 23.0, 29.0, 33.0, 40.0, 72.0, 102.0, 132.0, 192.0, 309.0, 548.0, 1069.0, 2643.0, 8909.0, 47131.0, 394717.0, 513222.0, 62248.0, 11074.0, 3083.0, 1232.0, 633.0, 378.0, 189.0, 144.0, 98.0, 59.0, 55.0, 42.0, 34.0, 23.0, 9.0, 7.0, 11.0, 4.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302734375, -0.5137405395507812, -0.4972076416015625, -0.48067474365234375, -0.464141845703125, -0.44760894775390625, -0.4310760498046875, -0.41454315185546875, -0.39801025390625, -0.38147735595703125, -0.3649444580078125, -0.34841156005859375, -0.331878662109375, -0.31534576416015625, -0.2988128662109375, -0.28227996826171875, -0.2657470703125, -0.24921417236328125, -0.2326812744140625, -0.21614837646484375, -0.199615478515625, -0.18308258056640625, -0.1665496826171875, -0.15001678466796875, -0.13348388671875, -0.11695098876953125, -0.1004180908203125, -0.08388519287109375, -0.067352294921875, -0.05081939697265625, -0.0342864990234375, -0.01775360107421875, -0.001220703125, 0.01531219482421875, 0.0318450927734375, 0.04837799072265625, 0.064910888671875, 0.08144378662109375, 0.0979766845703125, 0.11450958251953125, 0.13104248046875, 0.14757537841796875, 0.1641082763671875, 0.18064117431640625, 0.197174072265625, 0.21370697021484375, 0.2302398681640625, 0.24677276611328125, 0.2633056640625, 0.27983856201171875, 0.2963714599609375, 0.31290435791015625, 0.329437255859375, 0.34597015380859375, 0.3625030517578125, 0.37903594970703125, 0.39556884765625, 0.41210174560546875, 0.4286346435546875, 0.44516754150390625, 0.461700439453125, 0.47823333740234375, 0.4947662353515625, 0.5112991333007812, 0.52783203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 12.0, 13.0, 24.0, 51.0, 80.0, 75.0, 120.0, 114.0, 138.0, 121.0, 98.0, 79.0, 34.0, 24.0, 13.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17172622680664062, -0.16559600830078125, -0.15946578979492188, -0.1533355712890625, -0.14720535278320312, -0.14107513427734375, -0.13494491577148438, -0.128814697265625, -0.12268447875976562, -0.11655426025390625, -0.11042404174804688, -0.1042938232421875, -0.09816360473632812, -0.09203338623046875, -0.08590316772460938, -0.07977294921875, -0.07364273071289062, -0.06751251220703125, -0.061382293701171875, -0.0552520751953125, -0.049121856689453125, -0.04299163818359375, -0.036861419677734375, -0.030731201171875, -0.024600982666015625, -0.01847076416015625, -0.012340545654296875, -0.0062103271484375, -8.0108642578125e-05, 0.00605010986328125, 0.012180328369140625, 0.018310546875, 0.024440765380859375, 0.03057098388671875, 0.036701202392578125, 0.0428314208984375, 0.048961639404296875, 0.05509185791015625, 0.061222076416015625, 0.067352294921875, 0.07348251342773438, 0.07961273193359375, 0.08574295043945312, 0.0918731689453125, 0.09800338745117188, 0.10413360595703125, 0.11026382446289062, 0.11639404296875, 0.12252426147460938, 0.12865447998046875, 0.13478469848632812, 0.1409149169921875, 0.14704513549804688, 0.15317535400390625, 0.15930557250976562, 0.165435791015625, 0.17156600952148438, 0.17769622802734375, 0.18382644653320312, 0.1899566650390625, 0.19608688354492188, 0.20221710205078125, 0.20834732055664062, 0.2144775390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 18.0, 12.0, 22.0, 30.0, 48.0, 64.0, 78.0, 124.0, 185.0, 337.0, 536.0, 995.0, 2011.0, 4528.0, 11690.0, 33327.0, 114192.0, 420331.0, 332558.0, 84531.0, 25815.0, 9425.0, 3823.0, 1651.0, 861.0, 477.0, 291.0, 179.0, 109.0, 90.0, 55.0, 30.0, 33.0, 16.0, 13.0, 14.0, 8.0, 10.0, 1.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2506828308105469, -0.24282073974609375, -0.23495864868164062, -0.2270965576171875, -0.21923446655273438, -0.21137237548828125, -0.20351028442382812, -0.195648193359375, -0.18778610229492188, -0.17992401123046875, -0.17206192016601562, -0.1641998291015625, -0.15633773803710938, -0.14847564697265625, -0.14061355590820312, -0.13275146484375, -0.12488937377929688, -0.11702728271484375, -0.10916519165039062, -0.1013031005859375, -0.09344100952148438, -0.08557891845703125, -0.07771682739257812, -0.069854736328125, -0.061992645263671875, -0.05413055419921875, -0.046268463134765625, -0.0384063720703125, -0.030544281005859375, -0.02268218994140625, -0.014820098876953125, -0.0069580078125, 0.000904083251953125, 0.00876617431640625, 0.016628265380859375, 0.0244903564453125, 0.032352447509765625, 0.04021453857421875, 0.048076629638671875, 0.055938720703125, 0.06380081176757812, 0.07166290283203125, 0.07952499389648438, 0.0873870849609375, 0.09524917602539062, 0.10311126708984375, 0.11097335815429688, 0.11883544921875, 0.12669754028320312, 0.13455963134765625, 0.14242172241210938, 0.1502838134765625, 0.15814590454101562, 0.16600799560546875, 0.17387008666992188, 0.181732177734375, 0.18959426879882812, 0.19745635986328125, 0.20531845092773438, 0.2131805419921875, 0.22104263305664062, 0.22890472412109375, 0.23676681518554688, 0.24462890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 6.0, 8.0, 6.0, 6.0, 15.0, 14.0, 17.0, 21.0, 15.0, 29.0, 32.0, 27.0, 41.0, 45.0, 43.0, 33.0, 61.0, 50.0, 44.0, 35.0, 55.0, 42.0, 42.0, 36.0, 30.0, 29.0, 28.0, 30.0, 24.0, 22.0, 17.0, 21.0, 20.0, 7.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.306396484375, -0.2976531982421875, -0.288909912109375, -0.2801666259765625, -0.27142333984375, -0.2626800537109375, -0.253936767578125, -0.2451934814453125, -0.2364501953125, -0.2277069091796875, -0.218963623046875, -0.2102203369140625, -0.20147705078125, -0.1927337646484375, -0.183990478515625, -0.1752471923828125, -0.16650390625, -0.1577606201171875, -0.149017333984375, -0.1402740478515625, -0.13153076171875, -0.1227874755859375, -0.114044189453125, -0.1053009033203125, -0.0965576171875, -0.0878143310546875, -0.079071044921875, -0.0703277587890625, -0.06158447265625, -0.0528411865234375, -0.044097900390625, -0.0353546142578125, -0.026611328125, -0.0178680419921875, -0.009124755859375, -0.0003814697265625, 0.00836181640625, 0.0171051025390625, 0.025848388671875, 0.0345916748046875, 0.0433349609375, 0.0520782470703125, 0.060821533203125, 0.0695648193359375, 0.07830810546875, 0.0870513916015625, 0.095794677734375, 0.1045379638671875, 0.11328125, 0.1220245361328125, 0.130767822265625, 0.1395111083984375, 0.14825439453125, 0.1569976806640625, 0.165740966796875, 0.1744842529296875, 0.1832275390625, 0.1919708251953125, 0.200714111328125, 0.2094573974609375, 0.21820068359375, 0.2269439697265625, 0.235687255859375, 0.2444305419921875, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 13.0, 20.0, 32.0, 81.0, 131.0, 327.0, 906.0, 3290.0, 23366.0, 405674.0, 572100.0, 36529.0, 4228.0, 1107.0, 398.0, 162.0, 79.0, 36.0, 19.0, 20.0, 6.0, 9.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.259521484375, -0.2537651062011719, -0.24800872802734375, -0.24225234985351562, -0.2364959716796875, -0.23073959350585938, -0.22498321533203125, -0.21922683715820312, -0.213470458984375, -0.20771408081054688, -0.20195770263671875, -0.19620132446289062, -0.1904449462890625, -0.18468856811523438, -0.17893218994140625, -0.17317581176757812, -0.16741943359375, -0.16166305541992188, -0.15590667724609375, -0.15015029907226562, -0.1443939208984375, -0.13863754272460938, -0.13288116455078125, -0.12712478637695312, -0.121368408203125, -0.11561203002929688, -0.10985565185546875, -0.10409927368164062, -0.0983428955078125, -0.09258651733398438, -0.08683013916015625, -0.08107376098632812, -0.0753173828125, -0.06956100463867188, -0.06380462646484375, -0.058048248291015625, -0.0522918701171875, -0.046535491943359375, -0.04077911376953125, -0.035022735595703125, -0.029266357421875, -0.023509979248046875, -0.01775360107421875, -0.011997222900390625, -0.0062408447265625, -0.000484466552734375, 0.00527191162109375, 0.011028289794921875, 0.01678466796875, 0.022541046142578125, 0.02829742431640625, 0.034053802490234375, 0.0398101806640625, 0.045566558837890625, 0.05132293701171875, 0.057079315185546875, 0.062835693359375, 0.06859207153320312, 0.07434844970703125, 0.08010482788085938, 0.0858612060546875, 0.09161758422851562, 0.09737396240234375, 0.10313034057617188, 0.10888671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 9.0, 15.0, 13.0, 18.0, 27.0, 36.0, 34.0, 49.0, 85.0, 93.0, 102.0, 101.0, 98.0, 81.0, 51.0, 57.0, 30.0, 36.0, 16.0, 13.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022554397583007812, -0.0002199411392211914, -0.0002143383026123047, -0.00020873546600341797, -0.00020313262939453125, -0.00019752979278564453, -0.0001919269561767578, -0.0001863241195678711, -0.00018072128295898438, -0.00017511844635009766, -0.00016951560974121094, -0.00016391277313232422, -0.0001583099365234375, -0.00015270709991455078, -0.00014710426330566406, -0.00014150142669677734, -0.00013589859008789062, -0.0001302957534790039, -0.0001246929168701172, -0.00011909008026123047, -0.00011348724365234375, -0.00010788440704345703, -0.00010228157043457031, -9.66787338256836e-05, -9.107589721679688e-05, -8.547306060791016e-05, -7.987022399902344e-05, -7.426738739013672e-05, -6.866455078125e-05, -6.306171417236328e-05, -5.745887756347656e-05, -5.1856040954589844e-05, -4.6253204345703125e-05, -4.0650367736816406e-05, -3.504753112792969e-05, -2.944469451904297e-05, -2.384185791015625e-05, -1.823902130126953e-05, -1.2636184692382812e-05, -7.033348083496094e-06, -1.430511474609375e-06, 4.172325134277344e-06, 9.775161743164062e-06, 1.537799835205078e-05, 2.09808349609375e-05, 2.658367156982422e-05, 3.218650817871094e-05, 3.7789344787597656e-05, 4.3392181396484375e-05, 4.8995018005371094e-05, 5.459785461425781e-05, 6.020069122314453e-05, 6.580352783203125e-05, 7.140636444091797e-05, 7.700920104980469e-05, 8.26120376586914e-05, 8.821487426757812e-05, 9.381771087646484e-05, 9.942054748535156e-05, 0.00010502338409423828, 0.000110626220703125, 0.00011622905731201172, 0.00012183189392089844, 0.00012743473052978516, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 9.0, 18.0, 36.0, 76.0, 157.0, 334.0, 831.0, 2467.0, 11892.0, 145975.0, 752602.0, 119803.0, 10574.0, 2339.0, 826.0, 290.0, 130.0, 73.0, 46.0, 17.0, 13.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19482421875, -0.1894817352294922, -0.18413925170898438, -0.17879676818847656, -0.17345428466796875, -0.16811180114746094, -0.16276931762695312, -0.1574268341064453, -0.1520843505859375, -0.1467418670654297, -0.14139938354492188, -0.13605690002441406, -0.13071441650390625, -0.12537193298339844, -0.12002944946289062, -0.11468696594238281, -0.109344482421875, -0.10400199890136719, -0.09865951538085938, -0.09331703186035156, -0.08797454833984375, -0.08263206481933594, -0.07728958129882812, -0.07194709777832031, -0.0666046142578125, -0.06126213073730469, -0.055919647216796875, -0.05057716369628906, -0.04523468017578125, -0.03989219665527344, -0.034549713134765625, -0.029207229614257812, -0.02386474609375, -0.018522262573242188, -0.013179779052734375, -0.007837295532226562, -0.00249481201171875, 0.0028476715087890625, 0.008190155029296875, 0.013532638549804688, 0.0188751220703125, 0.024217605590820312, 0.029560089111328125, 0.03490257263183594, 0.04024505615234375, 0.04558753967285156, 0.050930023193359375, 0.05627250671386719, 0.061614990234375, 0.06695747375488281, 0.07229995727539062, 0.07764244079589844, 0.08298492431640625, 0.08832740783691406, 0.09366989135742188, 0.09901237487792969, 0.1043548583984375, 0.10969734191894531, 0.11503982543945312, 0.12038230895996094, 0.12572479248046875, 0.13106727600097656, 0.13640975952148438, 0.1417522430419922, 0.1470947265625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 16.0, 23.0, 44.0, 48.0, 78.0, 94.0, 108.0, 137.0, 107.0, 78.0, 82.0, 57.0, 38.0, 18.0, 22.0, 12.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.1376953125, -0.1342153549194336, -0.1307353973388672, -0.12725543975830078, -0.12377548217773438, -0.12029552459716797, -0.11681556701660156, -0.11333560943603516, -0.10985565185546875, -0.10637569427490234, -0.10289573669433594, -0.09941577911376953, -0.09593582153320312, -0.09245586395263672, -0.08897590637207031, -0.0854959487915039, -0.0820159912109375, -0.0785360336303711, -0.07505607604980469, -0.07157611846923828, -0.06809616088867188, -0.06461620330810547, -0.06113624572753906, -0.057656288146972656, -0.05417633056640625, -0.050696372985839844, -0.04721641540527344, -0.04373645782470703, -0.040256500244140625, -0.03677654266357422, -0.03329658508300781, -0.029816627502441406, -0.026336669921875, -0.022856712341308594, -0.019376754760742188, -0.01589679718017578, -0.012416839599609375, -0.008936882019042969, -0.0054569244384765625, -0.0019769668579101562, 0.00150299072265625, 0.004982948303222656, 0.008462905883789062, 0.011942863464355469, 0.015422821044921875, 0.01890277862548828, 0.022382736206054688, 0.025862693786621094, 0.0293426513671875, 0.032822608947753906, 0.03630256652832031, 0.03978252410888672, 0.043262481689453125, 0.04674243927001953, 0.05022239685058594, 0.053702354431152344, 0.05718231201171875, 0.060662269592285156, 0.06414222717285156, 0.06762218475341797, 0.07110214233398438, 0.07458209991455078, 0.07806205749511719, 0.0815420150756836, 0.08502197265625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 18.0, 41.0, 96.0, 224.0, 334.0, 181.0, 59.0, 19.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9431120157241821, -1.8247101306915283, -1.7063082456588745, -1.5879063606262207, -1.469504475593567, -1.351102590560913, -1.2327005863189697, -1.1142988204956055, -0.9958968758583069, -0.8774949908256531, -0.7590931057929993, -0.6406911611557007, -0.5222892761230469, -0.40388739109039307, -0.28548550605773926, -0.16708362102508545, -0.04868173599243164, 0.06972015649080276, 0.18812204897403717, 0.3065239489078522, 0.424925833940506, 0.5433277487754822, 0.661729633808136, 0.7801315188407898, 0.8985334038734436, 1.0169353485107422, 1.135337233543396, 1.2537391185760498, 1.3721410036087036, 1.4905428886413574, 1.6089447736740112, 1.727346658706665, 1.8457486629486084, 1.9641505479812622, 2.082552433013916, 2.2009544372558594, 2.3193562030792236, 2.437758207321167, 2.5561599731445312, 2.6745619773864746, 2.792963743209839, 2.9113657474517822, 3.0297675132751465, 3.14816951751709, 3.266571283340454, 3.3849732875823975, 3.5033750534057617, 3.621777057647705, 3.7401790618896484, 3.858581066131592, 3.976982831954956, 4.09538459777832, 4.213786602020264, 4.332188606262207, 4.45059061050415, 4.5689921379089355, 4.687394142150879, 4.805796146392822, 4.924198150634766, 5.042599678039551, 5.161001682281494, 5.2794036865234375, 5.397805690765381, 5.516207218170166, 5.634609222412109]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 10.0, 11.0, 11.0, 17.0, 10.0, 24.0, 15.0, 26.0, 31.0, 31.0, 26.0, 38.0, 38.0, 42.0, 45.0, 62.0, 42.0, 42.0, 42.0, 50.0, 38.0, 29.0, 38.0, 30.0, 33.0, 23.0, 30.0, 23.0, 15.0, 16.0, 10.0, 17.0, 15.0, 11.0, 5.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.556401014328003, -1.510414481163025, -1.4644279479980469, -1.4184414148330688, -1.3724548816680908, -1.3264684677124023, -1.2804818153381348, -1.2344954013824463, -1.1885088682174683, -1.1425223350524902, -1.0965358018875122, -1.0505492687225342, -1.0045627355575562, -0.9585762619972229, -0.9125897288322449, -0.8666032552719116, -0.8206166625022888, -0.7746301293373108, -0.7286435961723328, -0.6826571226119995, -0.6366705894470215, -0.5906840562820435, -0.5446975231170654, -0.4987110197544098, -0.45272448658943176, -0.40673795342445374, -0.3607514500617981, -0.31476491689682007, -0.26877838373184204, -0.2227918803691864, -0.17680534720420837, -0.13081884384155273, -0.08483231067657471, -0.038845788687467575, 0.007140733301639557, 0.05312725901603699, 0.09911377727985382, 0.14510029554367065, 0.19108682870864868, 0.23707333207130432, 0.28305986523628235, 0.3290463984012604, 0.375032901763916, 0.42101943492889404, 0.46700596809387207, 0.5129925012588501, 0.5589790344238281, 0.6049655079841614, 0.6509520411491394, 0.6969385743141174, 0.7429251074790955, 0.7889115810394287, 0.8348981142044067, 0.8808846473693848, 0.9268711805343628, 0.9728577136993408, 1.0188442468643188, 1.0648307800292969, 1.110817313194275, 1.156803846359253, 1.202790379524231, 1.248776912689209, 1.2947633266448975, 1.3407498598098755, 1.3867363929748535]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 18.0, 34.0, 57.0, 125.0, 335.0, 1072.0, 8690.0, 4060158.0, 119018.0, 3427.0, 786.0, 272.0, 130.0, 67.0, 40.0, 16.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.3639678955078125, -1.308990478515625, -1.2540130615234375, -1.19903564453125, -1.1440582275390625, -1.089080810546875, -1.0341033935546875, -0.9791259765625, -0.9241485595703125, -0.869171142578125, -0.8141937255859375, -0.75921630859375, -0.7042388916015625, -0.649261474609375, -0.5942840576171875, -0.539306640625, -0.4843292236328125, -0.429351806640625, -0.3743743896484375, -0.31939697265625, -0.2644195556640625, -0.209442138671875, -0.1544647216796875, -0.0994873046875, -0.0445098876953125, 0.010467529296875, 0.0654449462890625, 0.12042236328125, 0.1753997802734375, 0.230377197265625, 0.2853546142578125, 0.34033203125, 0.3953094482421875, 0.450286865234375, 0.5052642822265625, 0.56024169921875, 0.6152191162109375, 0.670196533203125, 0.7251739501953125, 0.7801513671875, 0.8351287841796875, 0.890106201171875, 0.9450836181640625, 1.00006103515625, 1.0550384521484375, 1.110015869140625, 1.1649932861328125, 1.219970703125, 1.2749481201171875, 1.329925537109375, 1.3849029541015625, 1.43988037109375, 1.4948577880859375, 1.549835205078125, 1.6048126220703125, 1.6597900390625, 1.7147674560546875, 1.769744873046875, 1.8247222900390625, 1.87969970703125, 1.9346771240234375, 1.989654541015625, 2.0446319580078125, 2.099609375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 18.0, 16.0, 35.0, 51.0, 76.0, 97.0, 111.0, 124.0, 107.0, 118.0, 92.0, 56.0, 42.0, 32.0, 13.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.17180252075195312, -0.16562652587890625, -0.15945053100585938, -0.1532745361328125, -0.14709854125976562, -0.14092254638671875, -0.13474655151367188, -0.128570556640625, -0.12239456176757812, -0.11621856689453125, -0.11004257202148438, -0.1038665771484375, -0.09769058227539062, -0.09151458740234375, -0.08533859252929688, -0.07916259765625, -0.07298660278320312, -0.06681060791015625, -0.060634613037109375, -0.0544586181640625, -0.048282623291015625, -0.04210662841796875, -0.035930633544921875, -0.029754638671875, -0.023578643798828125, -0.01740264892578125, -0.011226654052734375, -0.0050506591796875, 0.001125335693359375, 0.00730133056640625, 0.013477325439453125, 0.0196533203125, 0.025829315185546875, 0.03200531005859375, 0.038181304931640625, 0.0443572998046875, 0.050533294677734375, 0.05670928955078125, 0.06288528442382812, 0.069061279296875, 0.07523727416992188, 0.08141326904296875, 0.08758926391601562, 0.0937652587890625, 0.09994125366210938, 0.10611724853515625, 0.11229324340820312, 0.11846923828125, 0.12464523315429688, 0.13082122802734375, 0.13699722290039062, 0.1431732177734375, 0.14934921264648438, 0.15552520751953125, 0.16170120239257812, 0.167877197265625, 0.17405319213867188, 0.18022918701171875, 0.18640518188476562, 0.1925811767578125, 0.19875717163085938, 0.20493316650390625, 0.21110916137695312, 0.21728515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 10.0, 27.0, 50.0, 81.0, 135.0, 261.0, 468.0, 999.0, 2248.0, 6915.0, 56262.0, 3847918.0, 259021.0, 14336.0, 3141.0, 1184.0, 549.0, 287.0, 148.0, 104.0, 55.0, 24.0, 21.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.509124755859375, -0.49139404296875, -0.473663330078125, -0.4559326171875, -0.438201904296875, -0.42047119140625, -0.402740478515625, -0.385009765625, -0.367279052734375, -0.34954833984375, -0.331817626953125, -0.3140869140625, -0.296356201171875, -0.27862548828125, -0.260894775390625, -0.2431640625, -0.225433349609375, -0.20770263671875, -0.189971923828125, -0.1722412109375, -0.154510498046875, -0.13677978515625, -0.119049072265625, -0.101318359375, -0.083587646484375, -0.06585693359375, -0.048126220703125, -0.0303955078125, -0.012664794921875, 0.00506591796875, 0.022796630859375, 0.04052734375, 0.058258056640625, 0.07598876953125, 0.093719482421875, 0.1114501953125, 0.129180908203125, 0.14691162109375, 0.164642333984375, 0.182373046875, 0.200103759765625, 0.21783447265625, 0.235565185546875, 0.2532958984375, 0.271026611328125, 0.28875732421875, 0.306488037109375, 0.32421875, 0.341949462890625, 0.35968017578125, 0.377410888671875, 0.3951416015625, 0.412872314453125, 0.43060302734375, 0.448333740234375, 0.466064453125, 0.483795166015625, 0.50152587890625, 0.519256591796875, 0.5369873046875, 0.554718017578125, 0.57244873046875, 0.590179443359375, 0.60791015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 4.0, 7.0, 6.0, 11.0, 19.0, 14.0, 55.0, 105.0, 340.0, 2152.0, 944.0, 228.0, 93.0, 42.0, 20.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.22510910034179688, -0.21755218505859375, -0.20999526977539062, -0.2024383544921875, -0.19488143920898438, -0.18732452392578125, -0.17976760864257812, -0.172210693359375, -0.16465377807617188, -0.15709686279296875, -0.14953994750976562, -0.1419830322265625, -0.13442611694335938, -0.12686920166015625, -0.11931228637695312, -0.11175537109375, -0.10419845581054688, -0.09664154052734375, -0.08908462524414062, -0.0815277099609375, -0.07397079467773438, -0.06641387939453125, -0.058856964111328125, -0.051300048828125, -0.043743133544921875, -0.03618621826171875, -0.028629302978515625, -0.0210723876953125, -0.013515472412109375, -0.00595855712890625, 0.001598358154296875, 0.0091552734375, 0.016712188720703125, 0.02426910400390625, 0.031826019287109375, 0.0393829345703125, 0.046939849853515625, 0.05449676513671875, 0.062053680419921875, 0.069610595703125, 0.07716751098632812, 0.08472442626953125, 0.09228134155273438, 0.0998382568359375, 0.10739517211914062, 0.11495208740234375, 0.12250900268554688, 0.13006591796875, 0.13762283325195312, 0.14517974853515625, 0.15273666381835938, 0.1602935791015625, 0.16785049438476562, 0.17540740966796875, 0.18296432495117188, 0.190521240234375, 0.19807815551757812, 0.20563507080078125, 0.21319198608398438, 0.2207489013671875, 0.22830581665039062, 0.23586273193359375, 0.24341964721679688, 0.2509765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 23.0, 72.0, 290.0, 405.0, 138.0, 43.0, 16.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.630551338195801, -3.556957960128784, -3.4833643436431885, -3.409770965576172, -3.336177349090576, -3.2625839710235596, -3.188990354537964, -3.1153969764709473, -3.0418033599853516, -2.968209981918335, -2.8946163654327393, -2.8210229873657227, -2.747429370880127, -2.6738359928131104, -2.6002423763275146, -2.526648998260498, -2.4530556201934814, -2.379462242126465, -2.305868625640869, -2.2322752475738525, -2.158681631088257, -2.0850882530212402, -2.0114946365356445, -1.937901258468628, -1.8643077611923218, -1.7907142639160156, -1.7171207666397095, -1.6435272693634033, -1.5699338912963867, -1.496340274810791, -1.4227468967437744, -1.3491533994674683, -1.275559902191162, -1.201966404914856, -1.1283729076385498, -1.0547794103622437, -0.9811859726905823, -0.9075924754142761, -0.8339990377426147, -0.7604055404663086, -0.6868120431900024, -0.6132185459136963, -0.5396250486373901, -0.46603161096572876, -0.3924381136894226, -0.31884461641311646, -0.2452511489391327, -0.17165768146514893, -0.09806418418884277, -0.024470701813697815, 0.049122780561447144, 0.1227162629365921, 0.19630974531173706, 0.2699032425880432, 0.343496710062027, 0.41709017753601074, 0.4906836748123169, 0.564277172088623, 0.6378706693649292, 0.7114641070365906, 0.7850576043128967, 0.8586511015892029, 0.9322445392608643, 1.0058380365371704, 1.0794315338134766]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 15.0, 13.0, 17.0, 31.0, 31.0, 45.0, 49.0, 79.0, 85.0, 62.0, 65.0, 66.0, 67.0, 76.0, 54.0, 48.0, 66.0, 29.0, 28.0, 17.0, 15.0, 13.0, 10.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9534122943878174, -0.9284040331840515, -0.9033958315849304, -0.8783875703811646, -0.8533793091773987, -0.8283711075782776, -0.8033628463745117, -0.7783546447753906, -0.7533463835716248, -0.7283381223678589, -0.7033299207687378, -0.6783216595649719, -0.653313398361206, -0.628305196762085, -0.6032969355583191, -0.5782886743545532, -0.5532804727554321, -0.5282722115516663, -0.5032640099525452, -0.4782557487487793, -0.4532475173473358, -0.42823928594589233, -0.40323102474212646, -0.378222793340683, -0.3532145023345947, -0.32820627093315125, -0.3031980097293854, -0.2781897783279419, -0.2531815469264984, -0.22817330062389374, -0.20316505432128906, -0.17815682291984558, -0.1531485915184021, -0.12814034521579742, -0.10313211381435394, -0.07812386751174927, -0.05311562865972519, -0.02810738980770111, -0.0030991435050964355, 0.021909087896347046, 0.04691733419895172, 0.0719255730509758, 0.09693381190299988, 0.12194205820560455, 0.14695030450820923, 0.1719585359096527, 0.19696678221225739, 0.22197501361370087, 0.24698325991630554, 0.271991491317749, 0.2969997525215149, 0.3220079839229584, 0.34701621532440186, 0.3720244765281677, 0.3970327079296112, 0.4220409393310547, 0.44704920053482056, 0.47205743193626404, 0.4970656931400299, 0.5220739245414734, 0.5470821857452393, 0.5720903873443604, 0.5970986485481262, 0.6221069097518921, 0.6471151113510132]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 7.0, 8.0, 17.0, 18.0, 33.0, 63.0, 105.0, 168.0, 423.0, 912.0, 2801.0, 13719.0, 295931.0, 703448.0, 24882.0, 3812.0, 1173.0, 498.0, 215.0, 141.0, 57.0, 39.0, 33.0, 11.0, 7.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.869140625, -0.8402938842773438, -0.8114471435546875, -0.7826004028320312, -0.753753662109375, -0.7249069213867188, -0.6960601806640625, -0.6672134399414062, -0.63836669921875, -0.6095199584960938, -0.5806732177734375, -0.5518264770507812, -0.522979736328125, -0.49413299560546875, -0.4652862548828125, -0.43643951416015625, -0.4075927734375, -0.37874603271484375, -0.3498992919921875, -0.32105255126953125, -0.292205810546875, -0.26335906982421875, -0.2345123291015625, -0.20566558837890625, -0.17681884765625, -0.14797210693359375, -0.1191253662109375, -0.09027862548828125, -0.061431884765625, -0.03258514404296875, -0.0037384033203125, 0.02510833740234375, 0.053955078125, 0.08280181884765625, 0.1116485595703125, 0.14049530029296875, 0.169342041015625, 0.19818878173828125, 0.2270355224609375, 0.25588226318359375, 0.28472900390625, 0.31357574462890625, 0.3424224853515625, 0.37126922607421875, 0.400115966796875, 0.42896270751953125, 0.4578094482421875, 0.48665618896484375, 0.5155029296875, 0.5443496704101562, 0.5731964111328125, 0.6020431518554688, 0.630889892578125, 0.6597366333007812, 0.6885833740234375, 0.7174301147460938, 0.74627685546875, 0.7751235961914062, 0.8039703369140625, 0.8328170776367188, 0.861663818359375, 0.8905105590820312, 0.9193572998046875, 0.9482040405273438, 0.97705078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 11.0, 12.0, 14.0, 32.0, 47.0, 70.0, 87.0, 99.0, 94.0, 116.0, 110.0, 99.0, 70.0, 52.0, 36.0, 29.0, 9.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1767578125, -0.1710987091064453, -0.16543960571289062, -0.15978050231933594, -0.15412139892578125, -0.14846229553222656, -0.14280319213867188, -0.1371440887451172, -0.1314849853515625, -0.1258258819580078, -0.12016677856445312, -0.11450767517089844, -0.10884857177734375, -0.10318946838378906, -0.09753036499023438, -0.09187126159667969, -0.086212158203125, -0.08055305480957031, -0.07489395141601562, -0.06923484802246094, -0.06357574462890625, -0.05791664123535156, -0.052257537841796875, -0.04659843444824219, -0.0409393310546875, -0.03528022766113281, -0.029621124267578125, -0.023962020874023438, -0.01830291748046875, -0.012643814086914062, -0.006984710693359375, -0.0013256072998046875, 0.00433349609375, 0.009992599487304688, 0.015651702880859375, 0.021310806274414062, 0.02696990966796875, 0.03262901306152344, 0.038288116455078125, 0.04394721984863281, 0.0496063232421875, 0.05526542663574219, 0.060924530029296875, 0.06658363342285156, 0.07224273681640625, 0.07790184020996094, 0.08356094360351562, 0.08922004699707031, 0.094879150390625, 0.10053825378417969, 0.10619735717773438, 0.11185646057128906, 0.11751556396484375, 0.12317466735839844, 0.12883377075195312, 0.1344928741455078, 0.1401519775390625, 0.1458110809326172, 0.15147018432617188, 0.15712928771972656, 0.16278839111328125, 0.16844749450683594, 0.17410659790039062, 0.1797657012939453, 0.1854248046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 5.0, 12.0, 2.0, 15.0, 15.0, 18.0, 28.0, 45.0, 67.0, 108.0, 156.0, 293.0, 646.0, 1677.0, 5105.0, 20999.0, 158455.0, 730310.0, 107785.0, 16109.0, 4136.0, 1306.0, 525.0, 285.0, 165.0, 93.0, 53.0, 39.0, 23.0, 14.0, 9.0, 8.0, 11.0, 4.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486572265625, -0.4728355407714844, -0.45909881591796875, -0.4453620910644531, -0.4316253662109375, -0.4178886413574219, -0.40415191650390625, -0.3904151916503906, -0.376678466796875, -0.3629417419433594, -0.34920501708984375, -0.3354682922363281, -0.3217315673828125, -0.3079948425292969, -0.29425811767578125, -0.2805213928222656, -0.26678466796875, -0.2530479431152344, -0.23931121826171875, -0.22557449340820312, -0.2118377685546875, -0.19810104370117188, -0.18436431884765625, -0.17062759399414062, -0.156890869140625, -0.14315414428710938, -0.12941741943359375, -0.11568069458007812, -0.1019439697265625, -0.08820724487304688, -0.07447052001953125, -0.060733795166015625, -0.0469970703125, -0.033260345458984375, -0.01952362060546875, -0.005786895751953125, 0.0079498291015625, 0.021686553955078125, 0.03542327880859375, 0.049160003662109375, 0.062896728515625, 0.07663345336914062, 0.09037017822265625, 0.10410690307617188, 0.1178436279296875, 0.13158035278320312, 0.14531707763671875, 0.15905380249023438, 0.17279052734375, 0.18652725219726562, 0.20026397705078125, 0.21400070190429688, 0.2277374267578125, 0.24147415161132812, 0.25521087646484375, 0.2689476013183594, 0.282684326171875, 0.2964210510253906, 0.31015777587890625, 0.3238945007324219, 0.3376312255859375, 0.3513679504394531, 0.36510467529296875, 0.3788414001464844, 0.392578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 11.0, 4.0, 10.0, 15.0, 13.0, 6.0, 25.0, 19.0, 19.0, 37.0, 44.0, 36.0, 46.0, 43.0, 46.0, 59.0, 43.0, 58.0, 45.0, 49.0, 39.0, 50.0, 40.0, 40.0, 24.0, 23.0, 28.0, 19.0, 23.0, 18.0, 8.0, 8.0, 7.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.32275390625, -0.31243896484375, -0.3021240234375, -0.29180908203125, -0.281494140625, -0.27117919921875, -0.2608642578125, -0.25054931640625, -0.240234375, -0.22991943359375, -0.2196044921875, -0.20928955078125, -0.198974609375, -0.18865966796875, -0.1783447265625, -0.16802978515625, -0.15771484375, -0.14739990234375, -0.1370849609375, -0.12677001953125, -0.116455078125, -0.10614013671875, -0.0958251953125, -0.08551025390625, -0.0751953125, -0.06488037109375, -0.0545654296875, -0.04425048828125, -0.033935546875, -0.02362060546875, -0.0133056640625, -0.00299072265625, 0.00732421875, 0.01763916015625, 0.0279541015625, 0.03826904296875, 0.048583984375, 0.05889892578125, 0.0692138671875, 0.07952880859375, 0.08984375, 0.10015869140625, 0.1104736328125, 0.12078857421875, 0.131103515625, 0.14141845703125, 0.1517333984375, 0.16204833984375, 0.17236328125, 0.18267822265625, 0.1929931640625, 0.20330810546875, 0.213623046875, 0.22393798828125, 0.2342529296875, 0.24456787109375, 0.2548828125, 0.26519775390625, 0.2755126953125, 0.28582763671875, 0.296142578125, 0.30645751953125, 0.3167724609375, 0.32708740234375, 0.33740234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 12.0, 20.0, 62.0, 210.0, 947.0, 21864.0, 1017566.0, 7075.0, 559.0, 146.0, 48.0, 17.0, 11.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6359786987304688, -0.6157073974609375, -0.5954360961914062, -0.575164794921875, -0.5548934936523438, -0.5346221923828125, -0.5143508911132812, -0.49407958984375, -0.47380828857421875, -0.4535369873046875, -0.43326568603515625, -0.412994384765625, -0.39272308349609375, -0.3724517822265625, -0.35218048095703125, -0.3319091796875, -0.31163787841796875, -0.2913665771484375, -0.27109527587890625, -0.250823974609375, -0.23055267333984375, -0.2102813720703125, -0.19001007080078125, -0.16973876953125, -0.14946746826171875, -0.1291961669921875, -0.10892486572265625, -0.088653564453125, -0.06838226318359375, -0.0481109619140625, -0.02783966064453125, -0.007568359375, 0.01270294189453125, 0.0329742431640625, 0.05324554443359375, 0.073516845703125, 0.09378814697265625, 0.1140594482421875, 0.13433074951171875, 0.15460205078125, 0.17487335205078125, 0.1951446533203125, 0.21541595458984375, 0.235687255859375, 0.25595855712890625, 0.2762298583984375, 0.29650115966796875, 0.3167724609375, 0.33704376220703125, 0.3573150634765625, 0.37758636474609375, 0.397857666015625, 0.41812896728515625, 0.4384002685546875, 0.45867156982421875, 0.47894287109375, 0.49921417236328125, 0.5194854736328125, 0.5397567749023438, 0.560028076171875, 0.5802993774414062, 0.6005706787109375, 0.6208419799804688, 0.64111328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 15.0, 46.0, 110.0, 212.0, 309.0, 171.0, 85.0, 30.0, 14.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007323622703552246, -0.0007089376449584961, -0.0006855130195617676, -0.0006620883941650391, -0.0006386637687683105, -0.000615239143371582, -0.0005918145179748535, -0.000568389892578125, -0.0005449652671813965, -0.000521540641784668, -0.0004981160163879395, -0.00047469139099121094, -0.0004512667655944824, -0.0004278421401977539, -0.0004044175148010254, -0.0003809928894042969, -0.00035756826400756836, -0.00033414363861083984, -0.00031071901321411133, -0.0002872943878173828, -0.0002638697624206543, -0.00024044513702392578, -0.00021702051162719727, -0.00019359588623046875, -0.00017017126083374023, -0.00014674663543701172, -0.0001233220100402832, -9.989738464355469e-05, -7.647275924682617e-05, -5.3048133850097656e-05, -2.962350845336914e-05, -6.198883056640625e-06, 1.722574234008789e-05, 4.0650367736816406e-05, 6.407499313354492e-05, 8.749961853027344e-05, 0.00011092424392700195, 0.00013434886932373047, 0.00015777349472045898, 0.0001811981201171875, 0.00020462274551391602, 0.00022804737091064453, 0.00025147199630737305, 0.00027489662170410156, 0.0002983212471008301, 0.0003217458724975586, 0.0003451704978942871, 0.0003685951232910156, 0.00039201974868774414, 0.00041544437408447266, 0.00043886899948120117, 0.0004622936248779297, 0.0004857182502746582, 0.0005091428756713867, 0.0005325675010681152, 0.0005559921264648438, 0.0005794167518615723, 0.0006028413772583008, 0.0006262660026550293, 0.0006496906280517578, 0.0006731152534484863, 0.0006965398788452148, 0.0007199645042419434, 0.0007433891296386719]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 12.0, 16.0, 35.0, 57.0, 103.0, 138.0, 297.0, 973.0, 24873.0, 1012579.0, 8239.0, 651.0, 244.0, 146.0, 78.0, 51.0, 25.0, 10.0, 8.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65576171875, -0.6377372741699219, -0.6197128295898438, -0.6016883850097656, -0.5836639404296875, -0.5656394958496094, -0.5476150512695312, -0.5295906066894531, -0.511566162109375, -0.4935417175292969, -0.47551727294921875, -0.4574928283691406, -0.4394683837890625, -0.4214439392089844, -0.40341949462890625, -0.3853950500488281, -0.36737060546875, -0.3493461608886719, -0.33132171630859375, -0.3132972717285156, -0.2952728271484375, -0.2772483825683594, -0.25922393798828125, -0.24119949340820312, -0.223175048828125, -0.20515060424804688, -0.18712615966796875, -0.16910171508789062, -0.1510772705078125, -0.13305282592773438, -0.11502838134765625, -0.09700393676757812, -0.0789794921875, -0.060955047607421875, -0.04293060302734375, -0.024906158447265625, -0.0068817138671875, 0.011142730712890625, 0.02916717529296875, 0.047191619873046875, 0.065216064453125, 0.08324050903320312, 0.10126495361328125, 0.11928939819335938, 0.1373138427734375, 0.15533828735351562, 0.17336273193359375, 0.19138717651367188, 0.20941162109375, 0.22743606567382812, 0.24546051025390625, 0.2634849548339844, 0.2815093994140625, 0.2995338439941406, 0.31755828857421875, 0.3355827331542969, 0.353607177734375, 0.3716316223144531, 0.38965606689453125, 0.4076805114746094, 0.4257049560546875, 0.4437294006347656, 0.46175384521484375, 0.4797782897949219, 0.497802734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 14.0, 24.0, 135.0, 455.0, 301.0, 57.0, 14.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5134124755859375, -0.495574951171875, -0.4777374267578125, -0.45989990234375, -0.4420623779296875, -0.424224853515625, -0.4063873291015625, -0.3885498046875, -0.3707122802734375, -0.352874755859375, -0.3350372314453125, -0.31719970703125, -0.2993621826171875, -0.281524658203125, -0.2636871337890625, -0.245849609375, -0.2280120849609375, -0.210174560546875, -0.1923370361328125, -0.17449951171875, -0.1566619873046875, -0.138824462890625, -0.1209869384765625, -0.1031494140625, -0.0853118896484375, -0.067474365234375, -0.0496368408203125, -0.03179931640625, -0.0139617919921875, 0.003875732421875, 0.0217132568359375, 0.03955078125, 0.0573883056640625, 0.075225830078125, 0.0930633544921875, 0.11090087890625, 0.1287384033203125, 0.146575927734375, 0.1644134521484375, 0.1822509765625, 0.2000885009765625, 0.217926025390625, 0.2357635498046875, 0.25360107421875, 0.2714385986328125, 0.289276123046875, 0.3071136474609375, 0.324951171875, 0.3427886962890625, 0.360626220703125, 0.3784637451171875, 0.39630126953125, 0.4141387939453125, 0.431976318359375, 0.4498138427734375, 0.4676513671875, 0.4854888916015625, 0.503326416015625, 0.5211639404296875, 0.53900146484375, 0.5568389892578125, 0.574676513671875, 0.5925140380859375, 0.6103515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 16.0, 46.0, 121.0, 320.0, 338.0, 117.0, 28.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.74886417388916, -4.591914176940918, -4.434964656829834, -4.278014659881592, -4.121065139770508, -3.9641153812408447, -3.8071656227111816, -3.6502156257629395, -3.4932661056518555, -3.3363163471221924, -3.1793665885925293, -3.022416830062866, -2.865467071533203, -2.70851731300354, -2.551567554473877, -2.3946175575256348, -2.2376677989959717, -2.0807180404663086, -1.9237682819366455, -1.7668185234069824, -1.6098687648773193, -1.4529190063476562, -1.2959691286087036, -1.1390193700790405, -0.9820696115493774, -0.8251198530197144, -0.6681700944900513, -0.5112202763557434, -0.3542705178260803, -0.19732075929641724, -0.040370941162109375, 0.11657881736755371, 0.2735285758972168, 0.4304783344268799, 0.587428092956543, 0.7443779110908508, 0.9013276696205139, 1.0582773685455322, 1.2152272462844849, 1.372177004814148, 1.529126763343811, 1.6860765218734741, 1.8430262804031372, 1.9999761581420898, 2.156925916671753, 2.313875675201416, 2.470825433731079, 2.627775192260742, 2.7847249507904053, 2.9416747093200684, 3.0986244678497314, 3.2555742263793945, 3.4125239849090576, 3.5694737434387207, 3.726423740386963, 3.883373260498047, 4.040323257446289, 4.197273254394531, 4.354222774505615, 4.511172771453857, 4.668122291564941, 4.825072288513184, 4.982021808624268, 5.13897180557251, 5.295921325683594]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 8.0, 6.0, 7.0, 7.0, 11.0, 11.0, 18.0, 25.0, 14.0, 27.0, 31.0, 31.0, 31.0, 38.0, 40.0, 47.0, 49.0, 48.0, 40.0, 42.0, 35.0, 48.0, 47.0, 32.0, 40.0, 39.0, 32.0, 34.0, 24.0, 15.0, 15.0, 11.0, 11.0, 14.0, 12.0, 9.0, 4.0, 5.0, 5.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.5518990755081177, -1.5057920217514038, -1.4596848487854004, -1.4135777950286865, -1.367470622062683, -1.3213635683059692, -1.2752563953399658, -1.229149341583252, -1.183042287826538, -1.1369352340698242, -1.0908280611038208, -1.044721007347107, -0.9986138343811035, -0.9525067806243896, -0.906399667263031, -0.8602925539016724, -0.814185380935669, -0.7680782675743103, -0.7219711542129517, -0.6758641004562378, -0.6297569274902344, -0.5836498737335205, -0.5375427603721619, -0.4914356470108032, -0.4453285336494446, -0.39922142028808594, -0.3531143069267273, -0.30700722336769104, -0.2609001100063324, -0.21479299664497375, -0.1686859130859375, -0.12257879972457886, -0.07647180557250977, -0.03036469966173172, 0.015742406249046326, 0.061849504709243774, 0.10795661807060242, 0.15406373143196106, 0.20017081499099731, 0.24627792835235596, 0.2923850417137146, 0.33849215507507324, 0.3845992684364319, 0.43070635199546814, 0.4768134653568268, 0.5229206085205078, 0.5690276622772217, 0.6151347756385803, 0.661241888999939, 0.7073490023612976, 0.7534561157226562, 0.7995631694793701, 0.8456703424453735, 0.8917773962020874, 0.937884509563446, 0.9839916229248047, 1.0300986766815186, 1.0762057304382324, 1.1223129034042358, 1.1684199571609497, 1.2145271301269531, 1.260634183883667, 1.3067412376403809, 1.3528484106063843, 1.3989555835723877]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 18.0, 12.0, 29.0, 41.0, 71.0, 175.0, 337.0, 902.0, 3066.0, 23734.0, 4068376.0, 89445.0, 5676.0, 1284.0, 541.0, 243.0, 137.0, 84.0, 40.0, 24.0, 12.0, 15.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0736007690429688, -1.0417327880859375, -1.0098648071289062, -0.977996826171875, -0.9461288452148438, -0.9142608642578125, -0.8823928833007812, -0.85052490234375, -0.8186569213867188, -0.7867889404296875, -0.7549209594726562, -0.723052978515625, -0.6911849975585938, -0.6593170166015625, -0.6274490356445312, -0.5955810546875, -0.5637130737304688, -0.5318450927734375, -0.49997711181640625, -0.468109130859375, -0.43624114990234375, -0.4043731689453125, -0.37250518798828125, -0.34063720703125, -0.30876922607421875, -0.2769012451171875, -0.24503326416015625, -0.213165283203125, -0.18129730224609375, -0.1494293212890625, -0.11756134033203125, -0.085693359375, -0.05382537841796875, -0.0219573974609375, 0.00991058349609375, 0.041778564453125, 0.07364654541015625, 0.1055145263671875, 0.13738250732421875, 0.16925048828125, 0.20111846923828125, 0.2329864501953125, 0.26485443115234375, 0.296722412109375, 0.32859039306640625, 0.3604583740234375, 0.39232635498046875, 0.4241943359375, 0.45606231689453125, 0.4879302978515625, 0.5197982788085938, 0.551666259765625, 0.5835342407226562, 0.6154022216796875, 0.6472702026367188, 0.67913818359375, 0.7110061645507812, 0.7428741455078125, 0.7747421264648438, 0.806610107421875, 0.8384780883789062, 0.8703460693359375, 0.9022140502929688, 0.93408203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 17.0, 23.0, 34.0, 62.0, 74.0, 87.0, 99.0, 106.0, 95.0, 94.0, 90.0, 68.0, 54.0, 36.0, 22.0, 11.0, 11.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.171630859375, -0.1658935546875, -0.16015625, -0.1544189453125, -0.148681640625, -0.1429443359375, -0.13720703125, -0.1314697265625, -0.125732421875, -0.1199951171875, -0.1142578125, -0.1085205078125, -0.102783203125, -0.0970458984375, -0.09130859375, -0.0855712890625, -0.079833984375, -0.0740966796875, -0.068359375, -0.0626220703125, -0.056884765625, -0.0511474609375, -0.04541015625, -0.0396728515625, -0.033935546875, -0.0281982421875, -0.0224609375, -0.0167236328125, -0.010986328125, -0.0052490234375, 0.00048828125, 0.0062255859375, 0.011962890625, 0.0177001953125, 0.0234375, 0.0291748046875, 0.034912109375, 0.0406494140625, 0.04638671875, 0.0521240234375, 0.057861328125, 0.0635986328125, 0.0693359375, 0.0750732421875, 0.080810546875, 0.0865478515625, 0.09228515625, 0.0980224609375, 0.103759765625, 0.1094970703125, 0.115234375, 0.1209716796875, 0.126708984375, 0.1324462890625, 0.13818359375, 0.1439208984375, 0.149658203125, 0.1553955078125, 0.1611328125, 0.1668701171875, 0.172607421875, 0.1783447265625, 0.18408203125, 0.1898193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 17.0, 19.0, 32.0, 50.0, 87.0, 134.0, 239.0, 530.0, 1250.0, 4948.0, 54928.0, 4090656.0, 35265.0, 4023.0, 1100.0, 439.0, 237.0, 143.0, 65.0, 43.0, 26.0, 14.0, 18.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8916015625, -0.8623123168945312, -0.8330230712890625, -0.8037338256835938, -0.774444580078125, -0.7451553344726562, -0.7158660888671875, -0.6865768432617188, -0.65728759765625, -0.6279983520507812, -0.5987091064453125, -0.5694198608398438, -0.540130615234375, -0.5108413696289062, -0.4815521240234375, -0.45226287841796875, -0.4229736328125, -0.39368438720703125, -0.3643951416015625, -0.33510589599609375, -0.305816650390625, -0.27652740478515625, -0.2472381591796875, -0.21794891357421875, -0.18865966796875, -0.15937042236328125, -0.1300811767578125, -0.10079193115234375, -0.071502685546875, -0.04221343994140625, -0.0129241943359375, 0.01636505126953125, 0.045654296875, 0.07494354248046875, 0.1042327880859375, 0.13352203369140625, 0.162811279296875, 0.19210052490234375, 0.2213897705078125, 0.25067901611328125, 0.27996826171875, 0.30925750732421875, 0.3385467529296875, 0.36783599853515625, 0.397125244140625, 0.42641448974609375, 0.4557037353515625, 0.48499298095703125, 0.5142822265625, 0.5435714721679688, 0.5728607177734375, 0.6021499633789062, 0.631439208984375, 0.6607284545898438, 0.6900177001953125, 0.7193069458007812, 0.74859619140625, 0.7778854370117188, 0.8071746826171875, 0.8364639282226562, 0.865753173828125, 0.8950424194335938, 0.9243316650390625, 0.9536209106445312, 0.98291015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 10.0, 9.0, 10.0, 22.0, 49.0, 168.0, 1484.0, 2027.0, 182.0, 62.0, 22.0, 11.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30224609375, -0.2930946350097656, -0.28394317626953125, -0.2747917175292969, -0.2656402587890625, -0.2564888000488281, -0.24733734130859375, -0.23818588256835938, -0.229034423828125, -0.21988296508789062, -0.21073150634765625, -0.20158004760742188, -0.1924285888671875, -0.18327713012695312, -0.17412567138671875, -0.16497421264648438, -0.15582275390625, -0.14667129516601562, -0.13751983642578125, -0.12836837768554688, -0.1192169189453125, -0.11006546020507812, -0.10091400146484375, -0.09176254272460938, -0.082611083984375, -0.07345962524414062, -0.06430816650390625, -0.055156707763671875, -0.0460052490234375, -0.036853790283203125, -0.02770233154296875, -0.018550872802734375, -0.0093994140625, -0.000247955322265625, 0.00890350341796875, 0.018054962158203125, 0.0272064208984375, 0.036357879638671875, 0.04550933837890625, 0.054660797119140625, 0.063812255859375, 0.07296371459960938, 0.08211517333984375, 0.09126663208007812, 0.1004180908203125, 0.10956954956054688, 0.11872100830078125, 0.12787246704101562, 0.13702392578125, 0.14617538452148438, 0.15532684326171875, 0.16447830200195312, 0.1736297607421875, 0.18278121948242188, 0.19193267822265625, 0.20108413696289062, 0.210235595703125, 0.21938705444335938, 0.22853851318359375, 0.23768997192382812, 0.2468414306640625, 0.2559928894042969, 0.26514434814453125, 0.2742958068847656, 0.283447265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 55.0, 231.0, 422.0, 198.0, 47.0, 20.0, 2.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0669002532958984, -2.0030205249786377, -1.939140796661377, -1.8752609491348267, -1.811381220817566, -1.7475014925003052, -1.6836216449737549, -1.6197419166564941, -1.5558621883392334, -1.4919824600219727, -1.428102731704712, -1.3642228841781616, -1.3003431558609009, -1.2364634275436401, -1.1725835800170898, -1.108703851699829, -1.0448241233825684, -0.9809443950653076, -0.9170646071434021, -0.8531848192214966, -0.7893050909042358, -0.7254253625869751, -0.6615455746650696, -0.5976657867431641, -0.5337860584259033, -0.4699063003063202, -0.40602654218673706, -0.34214678406715393, -0.2782670259475708, -0.21438726782798767, -0.15050750970840454, -0.08662775158882141, -0.022748231887817383, 0.04113152623176575, 0.10501128435134888, 0.168891042470932, 0.23277080059051514, 0.29665055871009827, 0.3605303168296814, 0.4244100749492645, 0.48828983306884766, 0.5521695613861084, 0.6160493493080139, 0.6799291372299194, 0.7438088655471802, 0.8076885938644409, 0.8715683817863464, 0.935448169708252, 0.9993278980255127, 1.0632076263427734, 1.1270873546600342, 1.1909672021865845, 1.2548469305038452, 1.318726658821106, 1.3826065063476562, 1.446486234664917, 1.5103659629821777, 1.5742456912994385, 1.6381254196166992, 1.7020052671432495, 1.7658849954605103, 1.829764723777771, 1.8936445713043213, 1.957524299621582, 2.0214040279388428]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 14.0, 16.0, 23.0, 30.0, 43.0, 67.0, 70.0, 90.0, 96.0, 92.0, 96.0, 82.0, 68.0, 67.0, 45.0, 28.0, 29.0, 14.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6373637914657593, -0.6132196187973022, -0.5890754461288452, -0.5649312734603882, -0.5407871007919312, -0.5166428685188293, -0.4924986958503723, -0.4683545231819153, -0.44421035051345825, -0.4200661778450012, -0.3959220051765442, -0.37177780270576477, -0.34763363003730774, -0.3234894573688507, -0.2993452548980713, -0.27520108222961426, -0.2510569095611572, -0.2269127368927002, -0.20276854932308197, -0.17862436175346375, -0.1544801890850067, -0.13033601641654968, -0.10619182884693146, -0.08204764127731323, -0.0579034686088562, -0.03375928848981857, -0.009615108370780945, 0.014529071748256683, 0.03867325186729431, 0.06281743198633194, 0.08696161210536957, 0.11110579967498779, 0.13524991273880005, 0.15939408540725708, 0.1835382729768753, 0.20768246054649353, 0.23182663321495056, 0.2559708058834076, 0.280115008354187, 0.30425918102264404, 0.3284033536911011, 0.3525475263595581, 0.37669169902801514, 0.40083590149879456, 0.4249800741672516, 0.4491242468357086, 0.47326844930648804, 0.49741262197494507, 0.5215567946434021, 0.5457009673118591, 0.5698451399803162, 0.5939893126487732, 0.618133544921875, 0.642277717590332, 0.6664218902587891, 0.6905660629272461, 0.7147102355957031, 0.7388544082641602, 0.7629985809326172, 0.7871427536010742, 0.8112869262695312, 0.8354311585426331, 0.8595753312110901, 0.8837195038795471, 0.9078636765480042]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 20.0, 25.0, 39.0, 78.0, 126.0, 231.0, 480.0, 1251.0, 4620.0, 34030.0, 664377.0, 320260.0, 18063.0, 3109.0, 936.0, 413.0, 196.0, 112.0, 71.0, 28.0, 30.0, 12.0, 7.0, 12.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.7695541381835938, -0.7461395263671875, -0.7227249145507812, -0.699310302734375, -0.6758956909179688, -0.6524810791015625, -0.6290664672851562, -0.60565185546875, -0.5822372436523438, -0.5588226318359375, -0.5354080200195312, -0.511993408203125, -0.48857879638671875, -0.4651641845703125, -0.44174957275390625, -0.4183349609375, -0.39492034912109375, -0.3715057373046875, -0.34809112548828125, -0.324676513671875, -0.30126190185546875, -0.2778472900390625, -0.25443267822265625, -0.23101806640625, -0.20760345458984375, -0.1841888427734375, -0.16077423095703125, -0.137359619140625, -0.11394500732421875, -0.0905303955078125, -0.06711578369140625, -0.043701171875, -0.02028656005859375, 0.0031280517578125, 0.02654266357421875, 0.049957275390625, 0.07337188720703125, 0.0967864990234375, 0.12020111083984375, 0.14361572265625, 0.16703033447265625, 0.1904449462890625, 0.21385955810546875, 0.237274169921875, 0.26068878173828125, 0.2841033935546875, 0.30751800537109375, 0.3309326171875, 0.35434722900390625, 0.3777618408203125, 0.40117645263671875, 0.424591064453125, 0.44800567626953125, 0.4714202880859375, 0.49483489990234375, 0.51824951171875, 0.5416641235351562, 0.5650787353515625, 0.5884933471679688, 0.611907958984375, 0.6353225708007812, 0.6587371826171875, 0.6821517944335938, 0.70556640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 9.0, 17.0, 30.0, 39.0, 67.0, 73.0, 114.0, 87.0, 104.0, 112.0, 107.0, 83.0, 57.0, 49.0, 20.0, 15.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.18567848205566406, -0.17958450317382812, -0.1734905242919922, -0.16739654541015625, -0.1613025665283203, -0.15520858764648438, -0.14911460876464844, -0.1430206298828125, -0.13692665100097656, -0.13083267211914062, -0.12473869323730469, -0.11864471435546875, -0.11255073547363281, -0.10645675659179688, -0.10036277770996094, -0.094268798828125, -0.08817481994628906, -0.08208084106445312, -0.07598686218261719, -0.06989288330078125, -0.06379890441894531, -0.057704925537109375, -0.05161094665527344, -0.0455169677734375, -0.03942298889160156, -0.033329010009765625, -0.027235031127929688, -0.02114105224609375, -0.015047073364257812, -0.008953094482421875, -0.0028591156005859375, 0.00323486328125, 0.009328842163085938, 0.015422821044921875, 0.021516799926757812, 0.02761077880859375, 0.03370475769042969, 0.039798736572265625, 0.04589271545410156, 0.0519866943359375, 0.05808067321777344, 0.06417465209960938, 0.07026863098144531, 0.07636260986328125, 0.08245658874511719, 0.08855056762695312, 0.09464454650878906, 0.100738525390625, 0.10683250427246094, 0.11292648315429688, 0.11902046203613281, 0.12511444091796875, 0.1312084197998047, 0.13730239868164062, 0.14339637756347656, 0.1494903564453125, 0.15558433532714844, 0.16167831420898438, 0.1677722930908203, 0.17386627197265625, 0.1799602508544922, 0.18605422973632812, 0.19214820861816406, 0.1982421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 8.0, 8.0, 19.0, 13.0, 17.0, 38.0, 35.0, 58.0, 79.0, 135.0, 258.0, 536.0, 1709.0, 5982.0, 28431.0, 201684.0, 650360.0, 132125.0, 20249.0, 4433.0, 1307.0, 497.0, 215.0, 112.0, 58.0, 54.0, 30.0, 19.0, 19.0, 16.0, 15.0, 4.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322265625, -0.3116645812988281, -0.30106353759765625, -0.2904624938964844, -0.2798614501953125, -0.2692604064941406, -0.25865936279296875, -0.24805831909179688, -0.237457275390625, -0.22685623168945312, -0.21625518798828125, -0.20565414428710938, -0.1950531005859375, -0.18445205688476562, -0.17385101318359375, -0.16324996948242188, -0.15264892578125, -0.14204788208007812, -0.13144683837890625, -0.12084579467773438, -0.1102447509765625, -0.09964370727539062, -0.08904266357421875, -0.07844161987304688, -0.067840576171875, -0.057239532470703125, -0.04663848876953125, -0.036037445068359375, -0.0254364013671875, -0.014835357666015625, -0.00423431396484375, 0.006366729736328125, 0.0169677734375, 0.027568817138671875, 0.03816986083984375, 0.048770904541015625, 0.0593719482421875, 0.06997299194335938, 0.08057403564453125, 0.09117507934570312, 0.101776123046875, 0.11237716674804688, 0.12297821044921875, 0.13357925415039062, 0.1441802978515625, 0.15478134155273438, 0.16538238525390625, 0.17598342895507812, 0.18658447265625, 0.19718551635742188, 0.20778656005859375, 0.21838760375976562, 0.2289886474609375, 0.23958969116210938, 0.25019073486328125, 0.2607917785644531, 0.271392822265625, 0.2819938659667969, 0.29259490966796875, 0.3031959533691406, 0.3137969970703125, 0.3243980407714844, 0.33499908447265625, 0.3456001281738281, 0.356201171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 12.0, 8.0, 9.0, 11.0, 14.0, 13.0, 13.0, 14.0, 25.0, 32.0, 32.0, 29.0, 30.0, 43.0, 48.0, 41.0, 34.0, 57.0, 47.0, 49.0, 35.0, 48.0, 40.0, 45.0, 33.0, 34.0, 28.0, 24.0, 27.0, 19.0, 32.0, 20.0, 7.0, 11.0, 10.0, 3.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.273681640625, -0.2647056579589844, -0.25572967529296875, -0.24675369262695312, -0.2377777099609375, -0.22880172729492188, -0.21982574462890625, -0.21084976196289062, -0.201873779296875, -0.19289779663085938, -0.18392181396484375, -0.17494583129882812, -0.1659698486328125, -0.15699386596679688, -0.14801788330078125, -0.13904190063476562, -0.13006591796875, -0.12108993530273438, -0.11211395263671875, -0.10313796997070312, -0.0941619873046875, -0.08518600463867188, -0.07621002197265625, -0.06723403930664062, -0.058258056640625, -0.049282073974609375, -0.04030609130859375, -0.031330108642578125, -0.0223541259765625, -0.013378143310546875, -0.00440216064453125, 0.004573822021484375, 0.0135498046875, 0.022525787353515625, 0.03150177001953125, 0.040477752685546875, 0.0494537353515625, 0.058429718017578125, 0.06740570068359375, 0.07638168334960938, 0.085357666015625, 0.09433364868164062, 0.10330963134765625, 0.11228561401367188, 0.1212615966796875, 0.13023757934570312, 0.13921356201171875, 0.14818954467773438, 0.15716552734375, 0.16614151000976562, 0.17511749267578125, 0.18409347534179688, 0.1930694580078125, 0.20204544067382812, 0.21102142333984375, 0.21999740600585938, 0.228973388671875, 0.23794937133789062, 0.24692535400390625, 0.2559013366699219, 0.2648773193359375, 0.2738533020019531, 0.28282928466796875, 0.2918052673339844, 0.30078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 3.0, 6.0, 22.0, 19.0, 34.0, 60.0, 76.0, 123.0, 210.0, 373.0, 839.0, 2303.0, 9453.0, 78605.0, 648914.0, 275873.0, 24622.0, 4485.0, 1281.0, 498.0, 274.0, 158.0, 95.0, 61.0, 47.0, 30.0, 25.0, 18.0, 14.0, 7.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1539306640625, -0.14908218383789062, -0.14423370361328125, -0.13938522338867188, -0.1345367431640625, -0.12968826293945312, -0.12483978271484375, -0.11999130249023438, -0.115142822265625, -0.11029434204101562, -0.10544586181640625, -0.10059738159179688, -0.0957489013671875, -0.09090042114257812, -0.08605194091796875, -0.08120346069335938, -0.07635498046875, -0.07150650024414062, -0.06665802001953125, -0.061809539794921875, -0.0569610595703125, -0.052112579345703125, -0.04726409912109375, -0.042415618896484375, -0.037567138671875, -0.032718658447265625, -0.02787017822265625, -0.023021697998046875, -0.0181732177734375, -0.013324737548828125, -0.00847625732421875, -0.003627777099609375, 0.001220703125, 0.006069183349609375, 0.01091766357421875, 0.015766143798828125, 0.0206146240234375, 0.025463104248046875, 0.03031158447265625, 0.035160064697265625, 0.040008544921875, 0.044857025146484375, 0.04970550537109375, 0.054553985595703125, 0.0594024658203125, 0.06425094604492188, 0.06909942626953125, 0.07394790649414062, 0.07879638671875, 0.08364486694335938, 0.08849334716796875, 0.09334182739257812, 0.0981903076171875, 0.10303878784179688, 0.10788726806640625, 0.11273574829101562, 0.117584228515625, 0.12243270874023438, 0.12728118896484375, 0.13212966918945312, 0.1369781494140625, 0.14182662963867188, 0.14667510986328125, 0.15152359008789062, 0.1563720703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 13.0, 24.0, 41.0, 75.0, 121.0, 182.0, 183.0, 151.0, 93.0, 53.0, 28.0, 13.0, 17.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004470348358154297, -0.00043696723878383636, -0.00042689964175224304, -0.0004168320447206497, -0.0004067644476890564, -0.0003966968506574631, -0.00038662925362586975, -0.00037656165659427643, -0.0003664940595626831, -0.0003564264625310898, -0.00034635886549949646, -0.00033629126846790314, -0.0003262236714363098, -0.0003161560744047165, -0.00030608847737312317, -0.00029602088034152985, -0.0002859532833099365, -0.0002758856862783432, -0.0002658180892467499, -0.00025575049221515656, -0.00024568289518356323, -0.0002356152981519699, -0.0002255477011203766, -0.00021548010408878326, -0.00020541250705718994, -0.00019534491002559662, -0.0001852773129940033, -0.00017520971596240997, -0.00016514211893081665, -0.00015507452189922333, -0.00014500692486763, -0.00013493932783603668, -0.00012487173080444336, -0.00011480413377285004, -0.00010473653674125671, -9.466893970966339e-05, -8.460134267807007e-05, -7.453374564647675e-05, -6.446614861488342e-05, -5.43985515832901e-05, -4.433095455169678e-05, -3.4263357520103455e-05, -2.4195760488510132e-05, -1.4128163456916809e-05, -4.060566425323486e-06, 6.0070306062698364e-06, 1.607462763786316e-05, 2.6142224669456482e-05, 3.6209821701049805e-05, 4.627741873264313e-05, 5.634501576423645e-05, 6.641261279582977e-05, 7.64802098274231e-05, 8.654780685901642e-05, 9.661540389060974e-05, 0.00010668300092220306, 0.00011675059795379639, 0.0001268181949853897, 0.00013688579201698303, 0.00014695338904857635, 0.00015702098608016968, 0.000167088583111763, 0.00017715618014335632, 0.00018722377717494965, 0.00019729137420654297]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 11.0, 9.0, 20.0, 29.0, 59.0, 144.0, 286.0, 815.0, 4432.0, 71730.0, 870650.0, 93860.0, 4921.0, 972.0, 319.0, 142.0, 67.0, 31.0, 18.0, 17.0, 6.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19045448303222656, -0.18327713012695312, -0.1760997772216797, -0.16892242431640625, -0.1617450714111328, -0.15456771850585938, -0.14739036560058594, -0.1402130126953125, -0.13303565979003906, -0.12585830688476562, -0.11868095397949219, -0.11150360107421875, -0.10432624816894531, -0.09714889526367188, -0.08997154235839844, -0.082794189453125, -0.07561683654785156, -0.06843948364257812, -0.06126213073730469, -0.05408477783203125, -0.04690742492675781, -0.039730072021484375, -0.03255271911621094, -0.0253753662109375, -0.018198013305664062, -0.011020660400390625, -0.0038433074951171875, 0.00333404541015625, 0.010511398315429688, 0.017688751220703125, 0.024866104125976562, 0.03204345703125, 0.03922080993652344, 0.046398162841796875, 0.05357551574707031, 0.06075286865234375, 0.06793022155761719, 0.07510757446289062, 0.08228492736816406, 0.0894622802734375, 0.09663963317871094, 0.10381698608398438, 0.11099433898925781, 0.11817169189453125, 0.1253490447998047, 0.13252639770507812, 0.13970375061035156, 0.146881103515625, 0.15405845642089844, 0.16123580932617188, 0.1684131622314453, 0.17559051513671875, 0.1827678680419922, 0.18994522094726562, 0.19712257385253906, 0.2042999267578125, 0.21147727966308594, 0.21865463256835938, 0.2258319854736328, 0.23300933837890625, 0.2401866912841797, 0.24736404418945312, 0.25454139709472656, 0.26171875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 15.0, 24.0, 30.0, 84.0, 131.0, 195.0, 202.0, 146.0, 90.0, 50.0, 17.0, 10.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17106246948242188, -0.16365814208984375, -0.15625381469726562, -0.1488494873046875, -0.14144515991210938, -0.13404083251953125, -0.12663650512695312, -0.119232177734375, -0.11182785034179688, -0.10442352294921875, -0.09701919555664062, -0.0896148681640625, -0.08221054077148438, -0.07480621337890625, -0.06740188598632812, -0.05999755859375, -0.052593231201171875, -0.04518890380859375, -0.037784576416015625, -0.0303802490234375, -0.022975921630859375, -0.01557159423828125, -0.008167266845703125, -0.000762939453125, 0.006641387939453125, 0.01404571533203125, 0.021450042724609375, 0.0288543701171875, 0.036258697509765625, 0.04366302490234375, 0.051067352294921875, 0.0584716796875, 0.06587600708007812, 0.07328033447265625, 0.08068466186523438, 0.0880889892578125, 0.09549331665039062, 0.10289764404296875, 0.11030197143554688, 0.117706298828125, 0.12511062622070312, 0.13251495361328125, 0.13991928100585938, 0.1473236083984375, 0.15472793579101562, 0.16213226318359375, 0.16953659057617188, 0.17694091796875, 0.18434524536132812, 0.19174957275390625, 0.19915390014648438, 0.2065582275390625, 0.21396255493164062, 0.22136688232421875, 0.22877120971679688, 0.236175537109375, 0.24357986450195312, 0.25098419189453125, 0.2583885192871094, 0.2657928466796875, 0.2731971740722656, 0.28060150146484375, 0.2880058288574219, 0.29541015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 11.0, 31.0, 77.0, 251.0, 360.0, 204.0, 51.0, 17.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.137864589691162, -2.9975500106811523, -2.8572354316711426, -2.716920852661133, -2.576606273651123, -2.4362916946411133, -2.2959768772125244, -2.1556622982025146, -2.015347719192505, -1.8750331401824951, -1.7347185611724854, -1.594403862953186, -1.4540892839431763, -1.3137747049331665, -1.1734600067138672, -1.0331454277038574, -0.8928308486938477, -0.7525162696838379, -0.6122016310691833, -0.4718870222568512, -0.33157241344451904, -0.19125783443450928, -0.050943195819854736, 0.0893714427947998, 0.22968602180480957, 0.3700006306171417, 0.5103152394294739, 0.6506298780441284, 0.7909444570541382, 0.931259036064148, 1.0715737342834473, 1.211888313293457, 1.352203369140625, 1.4925179481506348, 1.6328325271606445, 1.7731472253799438, 1.9134618043899536, 2.053776264190674, 2.1940910816192627, 2.3344056606292725, 2.4747202396392822, 2.615034818649292, 2.7553493976593018, 2.8956639766693115, 3.0359787940979004, 3.17629337310791, 3.31660795211792, 3.4569225311279297, 3.5972371101379395, 3.737551689147949, 3.877866268157959, 4.018180847167969, 4.1584954261779785, 4.298810005187988, 4.439124584197998, 4.579439163208008, 4.719754219055176, 4.8600687980651855, 5.000383377075195, 5.140697956085205, 5.281012535095215, 5.421327114105225, 5.561641693115234, 5.701956748962402, 5.842270851135254]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 14.0, 13.0, 13.0, 18.0, 22.0, 26.0, 27.0, 30.0, 38.0, 39.0, 38.0, 40.0, 51.0, 55.0, 44.0, 70.0, 51.0, 40.0, 51.0, 51.0, 32.0, 43.0, 30.0, 31.0, 25.0, 24.0, 16.0, 16.0, 8.0, 11.0, 11.0, 7.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80057692527771, -1.7496801614761353, -1.6987833976745605, -1.6478866338729858, -1.5969898700714111, -1.5460931062698364, -1.4951963424682617, -1.444299578666687, -1.3934028148651123, -1.3425060510635376, -1.291609287261963, -1.2407125234603882, -1.1898157596588135, -1.1389189958572388, -1.088022232055664, -1.0371254682540894, -0.9862286448478699, -0.9353318810462952, -0.8844351172447205, -0.8335383534431458, -0.782641589641571, -0.7317447662353516, -0.6808480024337769, -0.6299512386322021, -0.5790544748306274, -0.5281577110290527, -0.477260947227478, -0.4263641834259033, -0.3754674196243286, -0.3245706260204315, -0.2736738622188568, -0.2227770984172821, -0.17188036441802979, -0.12098360061645508, -0.07008682936429977, -0.01919005811214447, 0.03170670568943024, 0.08260348439216614, 0.13350024819374084, 0.18439701199531555, 0.23529377579689026, 0.28619053959846497, 0.3370873034000397, 0.38798409700393677, 0.4388808608055115, 0.4897776246070862, 0.5406743884086609, 0.5915711522102356, 0.6424679160118103, 0.693364679813385, 0.7442614436149597, 0.7951582074165344, 0.8460549712181091, 0.8969517946243286, 0.9478485584259033, 0.998745322227478, 1.0496420860290527, 1.1005388498306274, 1.1514356136322021, 1.2023323774337769, 1.2532291412353516, 1.3041259050369263, 1.355022668838501, 1.4059194326400757, 1.4568161964416504]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 12.0, 26.0, 45.0, 71.0, 127.0, 245.0, 504.0, 1353.0, 4897.0, 35421.0, 4087816.0, 54870.0, 5985.0, 1537.0, 625.0, 301.0, 176.0, 98.0, 57.0, 31.0, 17.0, 10.0, 13.0, 7.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3095703125, -1.27056884765625, -1.2315673828125, -1.19256591796875, -1.153564453125, -1.11456298828125, -1.0755615234375, -1.03656005859375, -0.99755859375, -0.95855712890625, -0.9195556640625, -0.88055419921875, -0.841552734375, -0.80255126953125, -0.7635498046875, -0.72454833984375, -0.685546875, -0.64654541015625, -0.6075439453125, -0.56854248046875, -0.529541015625, -0.49053955078125, -0.4515380859375, -0.41253662109375, -0.37353515625, -0.33453369140625, -0.2955322265625, -0.25653076171875, -0.217529296875, -0.17852783203125, -0.1395263671875, -0.10052490234375, -0.0615234375, -0.02252197265625, 0.0164794921875, 0.05548095703125, 0.094482421875, 0.13348388671875, 0.1724853515625, 0.21148681640625, 0.25048828125, 0.28948974609375, 0.3284912109375, 0.36749267578125, 0.406494140625, 0.44549560546875, 0.4844970703125, 0.52349853515625, 0.5625, 0.60150146484375, 0.6405029296875, 0.67950439453125, 0.718505859375, 0.75750732421875, 0.7965087890625, 0.83551025390625, 0.87451171875, 0.91351318359375, 0.9525146484375, 0.99151611328125, 1.030517578125, 1.06951904296875, 1.1085205078125, 1.14752197265625, 1.1865234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 12.0, 13.0, 27.0, 34.0, 58.0, 70.0, 85.0, 84.0, 91.0, 110.0, 83.0, 90.0, 74.0, 52.0, 41.0, 28.0, 19.0, 13.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.1882762908935547, -0.18258285522460938, -0.17688941955566406, -0.17119598388671875, -0.16550254821777344, -0.15980911254882812, -0.1541156768798828, -0.1484222412109375, -0.1427288055419922, -0.13703536987304688, -0.13134193420410156, -0.12564849853515625, -0.11995506286621094, -0.11426162719726562, -0.10856819152832031, -0.102874755859375, -0.09718132019042969, -0.09148788452148438, -0.08579444885253906, -0.08010101318359375, -0.07440757751464844, -0.06871414184570312, -0.06302070617675781, -0.0573272705078125, -0.05163383483886719, -0.045940399169921875, -0.04024696350097656, -0.03455352783203125, -0.028860092163085938, -0.023166656494140625, -0.017473220825195312, -0.01177978515625, -0.0060863494873046875, -0.000392913818359375, 0.0053005218505859375, 0.01099395751953125, 0.016687393188476562, 0.022380828857421875, 0.028074264526367188, 0.0337677001953125, 0.03946113586425781, 0.045154571533203125, 0.05084800720214844, 0.05654144287109375, 0.06223487854003906, 0.06792831420898438, 0.07362174987792969, 0.079315185546875, 0.08500862121582031, 0.09070205688476562, 0.09639549255371094, 0.10208892822265625, 0.10778236389160156, 0.11347579956054688, 0.11916923522949219, 0.1248626708984375, 0.1305561065673828, 0.13624954223632812, 0.14194297790527344, 0.14763641357421875, 0.15332984924316406, 0.15902328491210938, 0.1647167205810547, 0.17041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 1.0, 5.0, 3.0, 5.0, 8.0, 9.0, 14.0, 22.0, 28.0, 44.0, 58.0, 77.0, 84.0, 134.0, 221.0, 301.0, 537.0, 882.0, 1666.0, 3922.0, 15350.0, 150819.0, 3929683.0, 74154.0, 9875.0, 2942.0, 1350.0, 747.0, 418.0, 302.0, 178.0, 126.0, 75.0, 61.0, 56.0, 39.0, 24.0, 17.0, 9.0, 5.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.517578125, -0.5005416870117188, -0.4835052490234375, -0.46646881103515625, -0.449432373046875, -0.43239593505859375, -0.4153594970703125, -0.39832305908203125, -0.38128662109375, -0.36425018310546875, -0.3472137451171875, -0.33017730712890625, -0.313140869140625, -0.29610443115234375, -0.2790679931640625, -0.26203155517578125, -0.2449951171875, -0.22795867919921875, -0.2109222412109375, -0.19388580322265625, -0.176849365234375, -0.15981292724609375, -0.1427764892578125, -0.12574005126953125, -0.10870361328125, -0.09166717529296875, -0.0746307373046875, -0.05759429931640625, -0.040557861328125, -0.02352142333984375, -0.0064849853515625, 0.01055145263671875, 0.027587890625, 0.04462432861328125, 0.0616607666015625, 0.07869720458984375, 0.095733642578125, 0.11277008056640625, 0.1298065185546875, 0.14684295654296875, 0.16387939453125, 0.18091583251953125, 0.1979522705078125, 0.21498870849609375, 0.232025146484375, 0.24906158447265625, 0.2660980224609375, 0.28313446044921875, 0.3001708984375, 0.31720733642578125, 0.3342437744140625, 0.35128021240234375, 0.368316650390625, 0.38535308837890625, 0.4023895263671875, 0.41942596435546875, 0.43646240234375, 0.45349884033203125, 0.4705352783203125, 0.48757171630859375, 0.504608154296875, 0.5216445922851562, 0.5386810302734375, 0.5557174682617188, 0.57275390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 5.0, 9.0, 12.0, 31.0, 74.0, 210.0, 2981.0, 562.0, 121.0, 36.0, 12.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.417236328125, -0.4072399139404297, -0.3972434997558594, -0.38724708557128906, -0.37725067138671875, -0.36725425720214844, -0.3572578430175781, -0.3472614288330078, -0.3372650146484375, -0.3272686004638672, -0.3172721862792969, -0.30727577209472656, -0.29727935791015625, -0.28728294372558594, -0.2772865295410156, -0.2672901153564453, -0.257293701171875, -0.2472972869873047, -0.23730087280273438, -0.22730445861816406, -0.21730804443359375, -0.20731163024902344, -0.19731521606445312, -0.1873188018798828, -0.1773223876953125, -0.1673259735107422, -0.15732955932617188, -0.14733314514160156, -0.13733673095703125, -0.12734031677246094, -0.11734390258789062, -0.10734748840332031, -0.09735107421875, -0.08735466003417969, -0.07735824584960938, -0.06736183166503906, -0.05736541748046875, -0.04736900329589844, -0.037372589111328125, -0.027376174926757812, -0.0173797607421875, -0.0073833465576171875, 0.002613067626953125, 0.012609481811523438, 0.02260589599609375, 0.03260231018066406, 0.042598724365234375, 0.05259513854980469, 0.062591552734375, 0.07258796691894531, 0.08258438110351562, 0.09258079528808594, 0.10257720947265625, 0.11257362365722656, 0.12257003784179688, 0.1325664520263672, 0.1425628662109375, 0.1525592803955078, 0.16255569458007812, 0.17255210876464844, 0.18254852294921875, 0.19254493713378906, 0.20254135131835938, 0.2125377655029297, 0.2225341796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 27.0, 131.0, 399.0, 332.0, 68.0, 11.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9986463785171509, -1.931889295578003, -1.8651320934295654, -1.7983750104904175, -1.7316179275512695, -1.6648608446121216, -1.5981037616729736, -1.5313465595245361, -1.4645894765853882, -1.3978323936462402, -1.3310751914978027, -1.2643181085586548, -1.1975610256195068, -1.1308039426803589, -1.064046859741211, -0.9972896575927734, -0.9305325746536255, -0.8637754917144775, -0.7970183491706848, -0.7302612066268921, -0.6635041236877441, -0.5967470407485962, -0.5299898982048035, -0.46323278546333313, -0.3964756727218628, -0.32971855998039246, -0.2629614472389221, -0.19620433449745178, -0.12944722175598145, -0.06269010901451111, 0.0040670037269592285, 0.07082411646842957, 0.13758111000061035, 0.2043382227420807, 0.271095335483551, 0.33785244822502136, 0.4046095609664917, 0.47136667370796204, 0.5381237864494324, 0.6048809289932251, 0.671638011932373, 0.738395094871521, 0.8051522374153137, 0.8719093799591064, 0.9386664628982544, 1.0054235458374023, 1.0721807479858398, 1.1389378309249878, 1.2056949138641357, 1.2724519968032837, 1.3392090797424316, 1.4059662818908691, 1.472723364830017, 1.539480447769165, 1.6062376499176025, 1.6729947328567505, 1.7397518157958984, 1.8065088987350464, 1.8732659816741943, 1.9400231838226318, 2.0067801475524902, 2.0735373497009277, 2.1402945518493652, 2.2070515155792236, 2.273808717727661]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 12.0, 19.0, 24.0, 35.0, 38.0, 48.0, 67.0, 80.0, 98.0, 78.0, 92.0, 67.0, 70.0, 63.0, 37.0, 41.0, 30.0, 26.0, 17.0, 15.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5990517735481262, -0.5756936073303223, -0.5523354411125183, -0.5289772748947144, -0.5056191086769104, -0.48226094245910645, -0.4589027762413025, -0.43554461002349854, -0.4121864438056946, -0.3888282775878906, -0.36547011137008667, -0.3421119451522827, -0.31875377893447876, -0.2953956127166748, -0.27203744649887085, -0.2486792653799057, -0.22532108426094055, -0.2019629180431366, -0.17860475182533264, -0.1552465856075287, -0.13188841938972473, -0.10853024572134018, -0.08517207205295563, -0.06181390583515167, -0.03845573961734772, -0.015097571536898613, 0.008260596543550491, 0.031618766486644745, 0.0549769327044487, 0.07833509892225266, 0.10169327259063721, 0.12505143880844116, 0.14840960502624512, 0.17176777124404907, 0.19512593746185303, 0.21848410367965698, 0.24184226989746094, 0.2652004361152649, 0.28855860233306885, 0.3119167685508728, 0.33527493476867676, 0.3586331009864807, 0.38199126720428467, 0.4053494334220886, 0.4287075996398926, 0.45206576585769653, 0.4754239320755005, 0.49878209829330444, 0.5221402645111084, 0.5454984307289124, 0.5688565969467163, 0.5922147631645203, 0.6155729293823242, 0.6389310956001282, 0.6622892618179321, 0.6856474280357361, 0.7090056538581848, 0.7323638200759888, 0.7557219862937927, 0.7790801525115967, 0.8024383187294006, 0.8257964849472046, 0.8491546511650085, 0.8725128173828125, 0.8958709836006165]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 13.0, 25.0, 15.0, 23.0, 39.0, 59.0, 74.0, 120.0, 154.0, 256.0, 412.0, 670.0, 1316.0, 2903.0, 8057.0, 26664.0, 113082.0, 480292.0, 319815.0, 66865.0, 17218.0, 5661.0, 2168.0, 1056.0, 547.0, 307.0, 192.0, 133.0, 110.0, 79.0, 57.0, 40.0, 22.0, 26.0, 17.0, 9.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.372802734375, -0.3617820739746094, -0.35076141357421875, -0.3397407531738281, -0.3287200927734375, -0.3176994323730469, -0.30667877197265625, -0.2956581115722656, -0.284637451171875, -0.2736167907714844, -0.26259613037109375, -0.2515754699707031, -0.2405548095703125, -0.22953414916992188, -0.21851348876953125, -0.20749282836914062, -0.19647216796875, -0.18545150756835938, -0.17443084716796875, -0.16341018676757812, -0.1523895263671875, -0.14136886596679688, -0.13034820556640625, -0.11932754516601562, -0.108306884765625, -0.09728622436523438, -0.08626556396484375, -0.07524490356445312, -0.0642242431640625, -0.053203582763671875, -0.04218292236328125, -0.031162261962890625, -0.0201416015625, -0.009120941162109375, 0.00189971923828125, 0.012920379638671875, 0.0239410400390625, 0.034961700439453125, 0.04598236083984375, 0.057003021240234375, 0.068023681640625, 0.07904434204101562, 0.09006500244140625, 0.10108566284179688, 0.1121063232421875, 0.12312698364257812, 0.13414764404296875, 0.14516830444335938, 0.15618896484375, 0.16720962524414062, 0.17823028564453125, 0.18925094604492188, 0.2002716064453125, 0.21129226684570312, 0.22231292724609375, 0.23333358764648438, 0.244354248046875, 0.2553749084472656, 0.26639556884765625, 0.2774162292480469, 0.2884368896484375, 0.2994575500488281, 0.31047821044921875, 0.3214988708496094, 0.33251953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 8.0, 17.0, 23.0, 31.0, 39.0, 62.0, 67.0, 86.0, 98.0, 99.0, 101.0, 77.0, 72.0, 75.0, 53.0, 24.0, 30.0, 15.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.2022876739501953, -0.19644546508789062, -0.19060325622558594, -0.18476104736328125, -0.17891883850097656, -0.17307662963867188, -0.1672344207763672, -0.1613922119140625, -0.1555500030517578, -0.14970779418945312, -0.14386558532714844, -0.13802337646484375, -0.13218116760253906, -0.12633895874023438, -0.12049674987792969, -0.114654541015625, -0.10881233215332031, -0.10297012329101562, -0.09712791442871094, -0.09128570556640625, -0.08544349670410156, -0.07960128784179688, -0.07375907897949219, -0.0679168701171875, -0.06207466125488281, -0.056232452392578125, -0.05039024353027344, -0.04454803466796875, -0.03870582580566406, -0.032863616943359375, -0.027021408081054688, -0.02117919921875, -0.015336990356445312, -0.009494781494140625, -0.0036525726318359375, 0.00218963623046875, 0.008031845092773438, 0.013874053955078125, 0.019716262817382812, 0.0255584716796875, 0.03140068054199219, 0.037242889404296875, 0.04308509826660156, 0.04892730712890625, 0.05476951599121094, 0.060611724853515625, 0.06645393371582031, 0.072296142578125, 0.07813835144042969, 0.08398056030273438, 0.08982276916503906, 0.09566497802734375, 0.10150718688964844, 0.10734939575195312, 0.11319160461425781, 0.1190338134765625, 0.12487602233886719, 0.13071823120117188, 0.13656044006347656, 0.14240264892578125, 0.14824485778808594, 0.15408706665039062, 0.1599292755126953, 0.165771484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 14.0, 12.0, 16.0, 22.0, 39.0, 27.0, 58.0, 82.0, 106.0, 193.0, 261.0, 449.0, 772.0, 1434.0, 3392.0, 9689.0, 36643.0, 172237.0, 541195.0, 218324.0, 44475.0, 11483.0, 3875.0, 1645.0, 808.0, 408.0, 242.0, 183.0, 145.0, 82.0, 53.0, 50.0, 36.0, 25.0, 25.0, 13.0, 9.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2442626953125, -0.23627281188964844, -0.22828292846679688, -0.2202930450439453, -0.21230316162109375, -0.2043132781982422, -0.19632339477539062, -0.18833351135253906, -0.1803436279296875, -0.17235374450683594, -0.16436386108398438, -0.1563739776611328, -0.14838409423828125, -0.1403942108154297, -0.13240432739257812, -0.12441444396972656, -0.116424560546875, -0.10843467712402344, -0.10044479370117188, -0.09245491027832031, -0.08446502685546875, -0.07647514343261719, -0.06848526000976562, -0.06049537658691406, -0.0525054931640625, -0.04451560974121094, -0.036525726318359375, -0.028535842895507812, -0.02054595947265625, -0.012556076049804688, -0.004566192626953125, 0.0034236907958984375, 0.01141357421875, 0.019403457641601562, 0.027393341064453125, 0.03538322448730469, 0.04337310791015625, 0.05136299133300781, 0.059352874755859375, 0.06734275817871094, 0.0753326416015625, 0.08332252502441406, 0.09131240844726562, 0.09930229187011719, 0.10729217529296875, 0.11528205871582031, 0.12327194213867188, 0.13126182556152344, 0.139251708984375, 0.14724159240722656, 0.15523147583007812, 0.1632213592529297, 0.17121124267578125, 0.1792011260986328, 0.18719100952148438, 0.19518089294433594, 0.2031707763671875, 0.21116065979003906, 0.21915054321289062, 0.2271404266357422, 0.23513031005859375, 0.2431201934814453, 0.2511100769042969, 0.25909996032714844, 0.26708984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 22.0, 22.0, 25.0, 26.0, 27.0, 34.0, 32.0, 29.0, 38.0, 36.0, 40.0, 39.0, 42.0, 59.0, 41.0, 44.0, 45.0, 42.0, 45.0, 37.0, 32.0, 35.0, 15.0, 21.0, 26.0, 15.0, 16.0, 13.0, 12.0, 12.0, 7.0, 4.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.433837890625, -0.42200469970703125, -0.4101715087890625, -0.39833831787109375, -0.386505126953125, -0.37467193603515625, -0.3628387451171875, -0.35100555419921875, -0.33917236328125, -0.32733917236328125, -0.3155059814453125, -0.30367279052734375, -0.291839599609375, -0.28000640869140625, -0.2681732177734375, -0.25634002685546875, -0.2445068359375, -0.23267364501953125, -0.2208404541015625, -0.20900726318359375, -0.197174072265625, -0.18534088134765625, -0.1735076904296875, -0.16167449951171875, -0.14984130859375, -0.13800811767578125, -0.1261749267578125, -0.11434173583984375, -0.102508544921875, -0.09067535400390625, -0.0788421630859375, -0.06700897216796875, -0.05517578125, -0.04334259033203125, -0.0315093994140625, -0.01967620849609375, -0.007843017578125, 0.00399017333984375, 0.0158233642578125, 0.02765655517578125, 0.03948974609375, 0.05132293701171875, 0.0631561279296875, 0.07498931884765625, 0.086822509765625, 0.09865570068359375, 0.1104888916015625, 0.12232208251953125, 0.1341552734375, 0.14598846435546875, 0.1578216552734375, 0.16965484619140625, 0.181488037109375, 0.19332122802734375, 0.2051544189453125, 0.21698760986328125, 0.22882080078125, 0.24065399169921875, 0.2524871826171875, 0.26432037353515625, 0.276153564453125, 0.28798675537109375, 0.2998199462890625, 0.31165313720703125, 0.323486328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 11.0, 36.0, 102.0, 415.0, 5786.0, 924535.0, 115932.0, 1462.0, 199.0, 40.0, 20.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.50738525390625, -0.4927978515625, -0.47821044921875, -0.463623046875, -0.44903564453125, -0.4344482421875, -0.41986083984375, -0.4052734375, -0.39068603515625, -0.3760986328125, -0.36151123046875, -0.346923828125, -0.33233642578125, -0.3177490234375, -0.30316162109375, -0.28857421875, -0.27398681640625, -0.2593994140625, -0.24481201171875, -0.230224609375, -0.21563720703125, -0.2010498046875, -0.18646240234375, -0.171875, -0.15728759765625, -0.1427001953125, -0.12811279296875, -0.113525390625, -0.09893798828125, -0.0843505859375, -0.06976318359375, -0.05517578125, -0.04058837890625, -0.0260009765625, -0.01141357421875, 0.003173828125, 0.01776123046875, 0.0323486328125, 0.04693603515625, 0.0615234375, 0.07611083984375, 0.0906982421875, 0.10528564453125, 0.119873046875, 0.13446044921875, 0.1490478515625, 0.16363525390625, 0.17822265625, 0.19281005859375, 0.2073974609375, 0.22198486328125, 0.236572265625, 0.25115966796875, 0.2657470703125, 0.28033447265625, 0.294921875, 0.30950927734375, 0.3240966796875, 0.33868408203125, 0.353271484375, 0.36785888671875, 0.3824462890625, 0.39703369140625, 0.41162109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 10.0, 27.0, 32.0, 53.0, 93.0, 109.0, 220.0, 176.0, 100.0, 65.0, 47.0, 34.0, 16.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002999305725097656, -0.00028908252716064453, -0.00027823448181152344, -0.00026738643646240234, -0.00025653839111328125, -0.00024569034576416016, -0.00023484230041503906, -0.00022399425506591797, -0.00021314620971679688, -0.00020229816436767578, -0.0001914501190185547, -0.0001806020736694336, -0.0001697540283203125, -0.0001589059829711914, -0.0001480579376220703, -0.00013720989227294922, -0.00012636184692382812, -0.00011551380157470703, -0.00010466575622558594, -9.381771087646484e-05, -8.296966552734375e-05, -7.212162017822266e-05, -6.127357482910156e-05, -5.042552947998047e-05, -3.9577484130859375e-05, -2.872943878173828e-05, -1.7881393432617188e-05, -7.033348083496094e-06, 3.814697265625e-06, 1.4662742614746094e-05, 2.5510787963867188e-05, 3.635883331298828e-05, 4.7206878662109375e-05, 5.805492401123047e-05, 6.890296936035156e-05, 7.975101470947266e-05, 9.059906005859375e-05, 0.00010144710540771484, 0.00011229515075683594, 0.00012314319610595703, 0.00013399124145507812, 0.00014483928680419922, 0.0001556873321533203, 0.0001665353775024414, 0.0001773834228515625, 0.0001882314682006836, 0.0001990795135498047, 0.00020992755889892578, 0.00022077560424804688, 0.00023162364959716797, 0.00024247169494628906, 0.00025331974029541016, 0.00026416778564453125, 0.00027501583099365234, 0.00028586387634277344, 0.00029671192169189453, 0.0003075599670410156, 0.0003184080123901367, 0.0003292560577392578, 0.0003401041030883789, 0.0003509521484375, 0.0003618001937866211, 0.0003726482391357422, 0.0003834962844848633, 0.0003943443298339844]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 20.0, 29.0, 56.0, 111.0, 200.0, 553.0, 2651.0, 41972.0, 873104.0, 123915.0, 4685.0, 766.0, 221.0, 105.0, 64.0, 38.0, 15.0, 15.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.29278564453125, -0.2838134765625, -0.27484130859375, -0.265869140625, -0.25689697265625, -0.2479248046875, -0.23895263671875, -0.22998046875, -0.22100830078125, -0.2120361328125, -0.20306396484375, -0.194091796875, -0.18511962890625, -0.1761474609375, -0.16717529296875, -0.158203125, -0.14923095703125, -0.1402587890625, -0.13128662109375, -0.122314453125, -0.11334228515625, -0.1043701171875, -0.09539794921875, -0.08642578125, -0.07745361328125, -0.0684814453125, -0.05950927734375, -0.050537109375, -0.04156494140625, -0.0325927734375, -0.02362060546875, -0.0146484375, -0.00567626953125, 0.0032958984375, 0.01226806640625, 0.021240234375, 0.03021240234375, 0.0391845703125, 0.04815673828125, 0.05712890625, 0.06610107421875, 0.0750732421875, 0.08404541015625, 0.093017578125, 0.10198974609375, 0.1109619140625, 0.11993408203125, 0.12890625, 0.13787841796875, 0.1468505859375, 0.15582275390625, 0.164794921875, 0.17376708984375, 0.1827392578125, 0.19171142578125, 0.20068359375, 0.20965576171875, 0.2186279296875, 0.22760009765625, 0.236572265625, 0.24554443359375, 0.2545166015625, 0.26348876953125, 0.2724609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 17.0, 50.0, 106.0, 186.0, 244.0, 204.0, 119.0, 50.0, 12.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.56689453125, -0.5556869506835938, -0.5444793701171875, -0.5332717895507812, -0.522064208984375, -0.5108566284179688, -0.4996490478515625, -0.48844146728515625, -0.47723388671875, -0.46602630615234375, -0.4548187255859375, -0.44361114501953125, -0.432403564453125, -0.42119598388671875, -0.4099884033203125, -0.39878082275390625, -0.3875732421875, -0.37636566162109375, -0.3651580810546875, -0.35395050048828125, -0.342742919921875, -0.33153533935546875, -0.3203277587890625, -0.30912017822265625, -0.29791259765625, -0.28670501708984375, -0.2754974365234375, -0.26428985595703125, -0.253082275390625, -0.24187469482421875, -0.2306671142578125, -0.21945953369140625, -0.208251953125, -0.19704437255859375, -0.1858367919921875, -0.17462921142578125, -0.163421630859375, -0.15221405029296875, -0.1410064697265625, -0.12979888916015625, -0.11859130859375, -0.10738372802734375, -0.0961761474609375, -0.08496856689453125, -0.073760986328125, -0.06255340576171875, -0.0513458251953125, -0.04013824462890625, -0.0289306640625, -0.01772308349609375, -0.0065155029296875, 0.00469207763671875, 0.015899658203125, 0.02710723876953125, 0.0383148193359375, 0.04952239990234375, 0.06072998046875, 0.07193756103515625, 0.0831451416015625, 0.09435272216796875, 0.105560302734375, 0.11676788330078125, 0.1279754638671875, 0.13918304443359375, 0.150390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 8.0, 21.0, 31.0, 103.0, 245.0, 277.0, 187.0, 79.0, 30.0, 9.0, 4.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.837831020355225, -5.712147235870361, -5.586463451385498, -5.460780143737793, -5.33509635925293, -5.209412574768066, -5.083728790283203, -4.95804500579834, -4.832361221313477, -4.706677436828613, -4.58099365234375, -4.455310344696045, -4.329626560211182, -4.203942775726318, -4.078258991241455, -3.952575206756592, -3.8268918991088867, -3.7012081146240234, -3.5755245685577393, -3.449840784072876, -3.324157238006592, -3.1984734535217285, -3.0727896690368652, -2.947105884552002, -2.8214223384857178, -2.6957385540008545, -2.5700550079345703, -2.444371223449707, -2.3186874389648438, -2.1930038928985596, -2.0673201084136963, -1.9416364431381226, -1.815953254699707, -1.6902695894241333, -1.5645859241485596, -1.4389021396636963, -1.3132184743881226, -1.1875348091125488, -1.0618510246276855, -0.9361673593521118, -0.8104836940765381, -0.6848000288009644, -0.5591163039207458, -0.43343260884284973, -0.3077489137649536, -0.18206524848937988, -0.05638152360916138, 0.06930220127105713, 0.19498586654663086, 0.320669561624527, 0.4463532567024231, 0.5720369815826416, 0.6977206468582153, 0.8234043121337891, 0.9490880370140076, 1.074771761894226, 1.2004554271697998, 1.3261390924453735, 1.4518227577209473, 1.5775065422058105, 1.7031902074813843, 1.828873872756958, 1.9545576572418213, 2.0802412033081055, 2.2059249877929688]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 11.0, 6.0, 7.0, 11.0, 15.0, 13.0, 13.0, 18.0, 20.0, 21.0, 25.0, 28.0, 35.0, 32.0, 41.0, 41.0, 40.0, 27.0, 31.0, 42.0, 45.0, 40.0, 43.0, 43.0, 41.0, 30.0, 26.0, 31.0, 38.0, 28.0, 17.0, 21.0, 20.0, 13.0, 22.0, 12.0, 9.0, 12.0, 8.0, 11.0, 9.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.745201587677002, -1.6897183656692505, -1.6342350244522095, -1.578751802444458, -1.523268461227417, -1.4677852392196655, -1.412302017211914, -1.356818675994873, -1.3013354539871216, -1.2458522319793701, -1.190368890762329, -1.1348856687545776, -1.0794024467468262, -1.0239191055297852, -0.9684358835220337, -0.9129526019096375, -0.8574693202972412, -0.801986038684845, -0.7465027570724487, -0.6910195350646973, -0.635536253452301, -0.5800529718399048, -0.5245697498321533, -0.4690864682197571, -0.41360318660736084, -0.3581199049949646, -0.30263665318489075, -0.2471533864736557, -0.19167011976242065, -0.13618683815002441, -0.08070358633995056, -0.02522033452987671, 0.03026282787322998, 0.08574609458446503, 0.14122936129570007, 0.19671262800693512, 0.25219589471817017, 0.3076791763305664, 0.36316242814064026, 0.4186456799507141, 0.47412896156311035, 0.5296122431755066, 0.5850955247879028, 0.6405787467956543, 0.6960620284080505, 0.7515453100204468, 0.8070285320281982, 0.8625118136405945, 0.9179950952529907, 0.973478376865387, 1.0289616584777832, 1.0844448804855347, 1.1399281024932861, 1.1954114437103271, 1.2508946657180786, 1.30637788772583, 1.361861228942871, 1.4173444509506226, 1.4728277921676636, 1.528311014175415, 1.583794355392456, 1.6392775774002075, 1.694760799407959, 1.750244140625, 1.8057273626327515]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 7.0, 5.0, 9.0, 4.0, 13.0, 20.0, 14.0, 33.0, 58.0, 58.0, 141.0, 270.0, 485.0, 965.0, 2115.0, 5613.0, 18651.0, 155817.0, 3941878.0, 50926.0, 10419.0, 3612.0, 1532.0, 708.0, 356.0, 193.0, 99.0, 87.0, 58.0, 33.0, 30.0, 19.0, 15.0, 9.0, 13.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.74267578125, -0.7216339111328125, -0.700592041015625, -0.6795501708984375, -0.65850830078125, -0.6374664306640625, -0.616424560546875, -0.5953826904296875, -0.5743408203125, -0.5532989501953125, -0.532257080078125, -0.5112152099609375, -0.49017333984375, -0.4691314697265625, -0.448089599609375, -0.4270477294921875, -0.406005859375, -0.3849639892578125, -0.363922119140625, -0.3428802490234375, -0.32183837890625, -0.3007965087890625, -0.279754638671875, -0.2587127685546875, -0.2376708984375, -0.2166290283203125, -0.195587158203125, -0.1745452880859375, -0.15350341796875, -0.1324615478515625, -0.111419677734375, -0.0903778076171875, -0.0693359375, -0.0482940673828125, -0.027252197265625, -0.0062103271484375, 0.01483154296875, 0.0358734130859375, 0.056915283203125, 0.0779571533203125, 0.0989990234375, 0.1200408935546875, 0.141082763671875, 0.1621246337890625, 0.18316650390625, 0.2042083740234375, 0.225250244140625, 0.2462921142578125, 0.267333984375, 0.2883758544921875, 0.309417724609375, 0.3304595947265625, 0.35150146484375, 0.3725433349609375, 0.393585205078125, 0.4146270751953125, 0.4356689453125, 0.4567108154296875, 0.477752685546875, 0.4987945556640625, 0.51983642578125, 0.5408782958984375, 0.561920166015625, 0.5829620361328125, 0.60400390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 18.0, 23.0, 42.0, 44.0, 60.0, 70.0, 71.0, 83.0, 88.0, 75.0, 75.0, 70.0, 74.0, 61.0, 34.0, 27.0, 26.0, 18.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2109375, -0.205047607421875, -0.19915771484375, -0.193267822265625, -0.1873779296875, -0.181488037109375, -0.17559814453125, -0.169708251953125, -0.163818359375, -0.157928466796875, -0.15203857421875, -0.146148681640625, -0.1402587890625, -0.134368896484375, -0.12847900390625, -0.122589111328125, -0.11669921875, -0.110809326171875, -0.10491943359375, -0.099029541015625, -0.0931396484375, -0.087249755859375, -0.08135986328125, -0.075469970703125, -0.069580078125, -0.063690185546875, -0.05780029296875, -0.051910400390625, -0.0460205078125, -0.040130615234375, -0.03424072265625, -0.028350830078125, -0.0224609375, -0.016571044921875, -0.01068115234375, -0.004791259765625, 0.0010986328125, 0.006988525390625, 0.01287841796875, 0.018768310546875, 0.024658203125, 0.030548095703125, 0.03643798828125, 0.042327880859375, 0.0482177734375, 0.054107666015625, 0.05999755859375, 0.065887451171875, 0.07177734375, 0.077667236328125, 0.08355712890625, 0.089447021484375, 0.0953369140625, 0.101226806640625, 0.10711669921875, 0.113006591796875, 0.118896484375, 0.124786376953125, 0.13067626953125, 0.136566162109375, 0.1424560546875, 0.148345947265625, 0.15423583984375, 0.160125732421875, 0.166015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 4.0, 10.0, 21.0, 22.0, 55.0, 60.0, 96.0, 157.0, 270.0, 430.0, 831.0, 1732.0, 4578.0, 20253.0, 389999.0, 3727023.0, 37437.0, 6777.0, 2179.0, 995.0, 523.0, 296.0, 171.0, 130.0, 81.0, 48.0, 36.0, 20.0, 19.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5810546875, -0.5624008178710938, -0.5437469482421875, -0.5250930786132812, -0.506439208984375, -0.48778533935546875, -0.4691314697265625, -0.45047760009765625, -0.43182373046875, -0.41316986083984375, -0.3945159912109375, -0.37586212158203125, -0.357208251953125, -0.33855438232421875, -0.3199005126953125, -0.30124664306640625, -0.2825927734375, -0.26393890380859375, -0.2452850341796875, -0.22663116455078125, -0.207977294921875, -0.18932342529296875, -0.1706695556640625, -0.15201568603515625, -0.13336181640625, -0.11470794677734375, -0.0960540771484375, -0.07740020751953125, -0.058746337890625, -0.04009246826171875, -0.0214385986328125, -0.00278472900390625, 0.015869140625, 0.03452301025390625, 0.0531768798828125, 0.07183074951171875, 0.090484619140625, 0.10913848876953125, 0.1277923583984375, 0.14644622802734375, 0.16510009765625, 0.18375396728515625, 0.2024078369140625, 0.22106170654296875, 0.239715576171875, 0.25836944580078125, 0.2770233154296875, 0.29567718505859375, 0.3143310546875, 0.33298492431640625, 0.3516387939453125, 0.37029266357421875, 0.388946533203125, 0.40760040283203125, 0.4262542724609375, 0.44490814208984375, 0.46356201171875, 0.48221588134765625, 0.5008697509765625, 0.5195236206054688, 0.538177490234375, 0.5568313598632812, 0.5754852294921875, 0.5941390991210938, 0.61279296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 11.0, 8.0, 14.0, 16.0, 45.0, 86.0, 506.0, 3039.0, 225.0, 66.0, 24.0, 12.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5318679809570312, -0.5183258056640625, -0.5047836303710938, -0.491241455078125, -0.47769927978515625, -0.4641571044921875, -0.45061492919921875, -0.43707275390625, -0.42353057861328125, -0.4099884033203125, -0.39644622802734375, -0.382904052734375, -0.36936187744140625, -0.3558197021484375, -0.34227752685546875, -0.3287353515625, -0.31519317626953125, -0.3016510009765625, -0.28810882568359375, -0.274566650390625, -0.26102447509765625, -0.2474822998046875, -0.23394012451171875, -0.22039794921875, -0.20685577392578125, -0.1933135986328125, -0.17977142333984375, -0.166229248046875, -0.15268707275390625, -0.1391448974609375, -0.12560272216796875, -0.112060546875, -0.09851837158203125, -0.0849761962890625, -0.07143402099609375, -0.057891845703125, -0.04434967041015625, -0.0308074951171875, -0.01726531982421875, -0.00372314453125, 0.00981903076171875, 0.0233612060546875, 0.03690338134765625, 0.050445556640625, 0.06398773193359375, 0.0775299072265625, 0.09107208251953125, 0.1046142578125, 0.11815643310546875, 0.1316986083984375, 0.14524078369140625, 0.158782958984375, 0.17232513427734375, 0.1858673095703125, 0.19940948486328125, 0.21295166015625, 0.22649383544921875, 0.2400360107421875, 0.25357818603515625, 0.267120361328125, 0.28066253662109375, 0.2942047119140625, 0.30774688720703125, 0.3212890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 14.0, 36.0, 170.0, 467.0, 232.0, 49.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.968031883239746, -3.87689208984375, -3.785752296447754, -3.694612503051758, -3.6034727096557617, -3.5123326778411865, -3.4211928844451904, -3.3300530910491943, -3.2389132976531982, -3.147773504257202, -3.056633710861206, -2.96549391746521, -2.8743538856506348, -2.7832140922546387, -2.6920742988586426, -2.6009345054626465, -2.5097947120666504, -2.4186549186706543, -2.327515125274658, -2.236375331878662, -2.145235538482666, -2.054095506668091, -1.9629557132720947, -1.8718159198760986, -1.7806761264801025, -1.6895363330841064, -1.5983965396881104, -1.5072566270828247, -1.4161168336868286, -1.3249770402908325, -1.2338371276855469, -1.1426973342895508, -1.0515577793121338, -0.9604179859161377, -0.8692781329154968, -0.778138279914856, -0.6869984865188599, -0.5958586931228638, -0.5047188401222229, -0.41357898712158203, -0.32243919372558594, -0.23129937052726746, -0.14015954732894897, -0.04901972413063049, 0.04212009906768799, 0.13325992226600647, 0.22439974546432495, 0.3155395984649658, 0.4066793918609619, 0.4978192150592804, 0.5889590382575989, 0.6800988912582397, 0.7712386846542358, 0.8623784780502319, 0.9535183310508728, 1.0446581840515137, 1.1357979774475098, 1.2269377708435059, 1.318077564239502, 1.4092174768447876, 1.5003572702407837, 1.5914970636367798, 1.6826369762420654, 1.7737767696380615, 1.8649165630340576]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 9.0, 10.0, 15.0, 17.0, 16.0, 31.0, 31.0, 36.0, 42.0, 50.0, 54.0, 49.0, 68.0, 59.0, 54.0, 59.0, 40.0, 46.0, 57.0, 39.0, 33.0, 30.0, 27.0, 31.0, 25.0, 18.0, 13.0, 5.0, 9.0, 7.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6551198363304138, -0.6312218904495239, -0.6073240041732788, -0.5834261178970337, -0.5595281720161438, -0.5356302261352539, -0.5117323398590088, -0.4878344237804413, -0.4639365077018738, -0.4400385916233063, -0.41614067554473877, -0.39224275946617126, -0.36834484338760376, -0.34444692730903625, -0.32054901123046875, -0.29665109515190125, -0.27275317907333374, -0.24885526299476624, -0.22495734691619873, -0.20105943083763123, -0.17716151475906372, -0.15326359868049622, -0.1293656826019287, -0.1054677665233612, -0.0815698504447937, -0.057671934366226196, -0.03377401828765869, -0.009876102209091187, 0.014021813869476318, 0.03791972994804382, 0.06181764602661133, 0.08571556210517883, 0.10961341857910156, 0.13351133465766907, 0.15740925073623657, 0.18130716681480408, 0.20520508289337158, 0.2291029989719391, 0.2530009150505066, 0.2768988311290741, 0.3007967472076416, 0.3246946632862091, 0.3485925793647766, 0.3724904954433441, 0.3963884115219116, 0.4202863276004791, 0.44418424367904663, 0.46808215975761414, 0.49198007583618164, 0.5158779621124268, 0.5397759079933167, 0.5636738538742065, 0.5875717401504517, 0.6114696264266968, 0.6353675723075867, 0.6592655181884766, 0.6831634044647217, 0.7070612907409668, 0.7309592366218567, 0.7548571825027466, 0.7787550687789917, 0.8026529550552368, 0.8265509009361267, 0.8504488468170166, 0.8743467330932617]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 13.0, 21.0, 25.0, 44.0, 90.0, 195.0, 371.0, 995.0, 3540.0, 28818.0, 684001.0, 312748.0, 14004.0, 2321.0, 719.0, 309.0, 157.0, 90.0, 31.0, 20.0, 13.0, 12.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8335189819335938, -0.8081512451171875, -0.7827835083007812, -0.757415771484375, -0.7320480346679688, -0.7066802978515625, -0.6813125610351562, -0.65594482421875, -0.6305770874023438, -0.6052093505859375, -0.5798416137695312, -0.554473876953125, -0.5291061401367188, -0.5037384033203125, -0.47837066650390625, -0.4530029296875, -0.42763519287109375, -0.4022674560546875, -0.37689971923828125, -0.351531982421875, -0.32616424560546875, -0.3007965087890625, -0.27542877197265625, -0.25006103515625, -0.22469329833984375, -0.1993255615234375, -0.17395782470703125, -0.148590087890625, -0.12322235107421875, -0.0978546142578125, -0.07248687744140625, -0.047119140625, -0.02175140380859375, 0.0036163330078125, 0.02898406982421875, 0.054351806640625, 0.07971954345703125, 0.1050872802734375, 0.13045501708984375, 0.15582275390625, 0.18119049072265625, 0.2065582275390625, 0.23192596435546875, 0.257293701171875, 0.28266143798828125, 0.3080291748046875, 0.33339691162109375, 0.3587646484375, 0.38413238525390625, 0.4095001220703125, 0.43486785888671875, 0.460235595703125, 0.48560333251953125, 0.5109710693359375, 0.5363388061523438, 0.56170654296875, 0.5870742797851562, 0.6124420166015625, 0.6378097534179688, 0.663177490234375, 0.6885452270507812, 0.7139129638671875, 0.7392807006835938, 0.7646484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 34.0, 44.0, 57.0, 74.0, 64.0, 72.0, 73.0, 91.0, 87.0, 88.0, 53.0, 66.0, 56.0, 29.0, 24.0, 12.0, 17.0, 10.0, 0.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221435546875, -0.21514892578125, -0.2088623046875, -0.20257568359375, -0.1962890625, -0.19000244140625, -0.1837158203125, -0.17742919921875, -0.171142578125, -0.16485595703125, -0.1585693359375, -0.15228271484375, -0.14599609375, -0.13970947265625, -0.1334228515625, -0.12713623046875, -0.120849609375, -0.11456298828125, -0.1082763671875, -0.10198974609375, -0.095703125, -0.08941650390625, -0.0831298828125, -0.07684326171875, -0.070556640625, -0.06427001953125, -0.0579833984375, -0.05169677734375, -0.04541015625, -0.03912353515625, -0.0328369140625, -0.02655029296875, -0.020263671875, -0.01397705078125, -0.0076904296875, -0.00140380859375, 0.0048828125, 0.01116943359375, 0.0174560546875, 0.02374267578125, 0.030029296875, 0.03631591796875, 0.0426025390625, 0.04888916015625, 0.05517578125, 0.06146240234375, 0.0677490234375, 0.07403564453125, 0.080322265625, 0.08660888671875, 0.0928955078125, 0.09918212890625, 0.10546875, 0.11175537109375, 0.1180419921875, 0.12432861328125, 0.130615234375, 0.13690185546875, 0.1431884765625, 0.14947509765625, 0.15576171875, 0.16204833984375, 0.1683349609375, 0.17462158203125, 0.180908203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 3.0, 3.0, 26.0, 18.0, 25.0, 48.0, 84.0, 137.0, 214.0, 388.0, 825.0, 2079.0, 7520.0, 49578.0, 583976.0, 364060.0, 30900.0, 5451.0, 1672.0, 716.0, 356.0, 181.0, 95.0, 64.0, 41.0, 34.0, 20.0, 15.0, 11.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.450927734375, -0.43721771240234375, -0.4235076904296875, -0.40979766845703125, -0.396087646484375, -0.38237762451171875, -0.3686676025390625, -0.35495758056640625, -0.34124755859375, -0.32753753662109375, -0.3138275146484375, -0.30011749267578125, -0.286407470703125, -0.27269744873046875, -0.2589874267578125, -0.24527740478515625, -0.2315673828125, -0.21785736083984375, -0.2041473388671875, -0.19043731689453125, -0.176727294921875, -0.16301727294921875, -0.1493072509765625, -0.13559722900390625, -0.12188720703125, -0.10817718505859375, -0.0944671630859375, -0.08075714111328125, -0.067047119140625, -0.05333709716796875, -0.0396270751953125, -0.02591705322265625, -0.01220703125, 0.00150299072265625, 0.0152130126953125, 0.02892303466796875, 0.042633056640625, 0.05634307861328125, 0.0700531005859375, 0.08376312255859375, 0.09747314453125, 0.11118316650390625, 0.1248931884765625, 0.13860321044921875, 0.152313232421875, 0.16602325439453125, 0.1797332763671875, 0.19344329833984375, 0.2071533203125, 0.22086334228515625, 0.2345733642578125, 0.24828338623046875, 0.261993408203125, 0.27570343017578125, 0.2894134521484375, 0.30312347412109375, 0.31683349609375, 0.33054351806640625, 0.3442535400390625, 0.35796356201171875, 0.371673583984375, 0.38538360595703125, 0.3990936279296875, 0.41280364990234375, 0.426513671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 4.0, 11.0, 12.0, 11.0, 12.0, 18.0, 33.0, 29.0, 36.0, 39.0, 58.0, 48.0, 47.0, 47.0, 64.0, 51.0, 56.0, 62.0, 49.0, 53.0, 44.0, 40.0, 26.0, 36.0, 25.0, 24.0, 23.0, 12.0, 4.0, 8.0, 8.0, 3.0, 8.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4603157043457031, -0.44235992431640625, -0.4244041442871094, -0.4064483642578125, -0.3884925842285156, -0.37053680419921875, -0.3525810241699219, -0.334625244140625, -0.3166694641113281, -0.29871368408203125, -0.2807579040527344, -0.2628021240234375, -0.24484634399414062, -0.22689056396484375, -0.20893478393554688, -0.19097900390625, -0.17302322387695312, -0.15506744384765625, -0.13711166381835938, -0.1191558837890625, -0.10120010375976562, -0.08324432373046875, -0.06528854370117188, -0.047332763671875, -0.029376983642578125, -0.01142120361328125, 0.006534576416015625, 0.0244903564453125, 0.042446136474609375, 0.06040191650390625, 0.07835769653320312, 0.0963134765625, 0.11426925659179688, 0.13222503662109375, 0.15018081665039062, 0.1681365966796875, 0.18609237670898438, 0.20404815673828125, 0.22200393676757812, 0.239959716796875, 0.2579154968261719, 0.27587127685546875, 0.2938270568847656, 0.3117828369140625, 0.3297386169433594, 0.34769439697265625, 0.3656501770019531, 0.38360595703125, 0.4015617370605469, 0.41951751708984375, 0.4374732971191406, 0.4554290771484375, 0.4733848571777344, 0.49134063720703125, 0.5092964172363281, 0.527252197265625, 0.5452079772949219, 0.5631637573242188, 0.5811195373535156, 0.5990753173828125, 0.6170310974121094, 0.6349868774414062, 0.6529426574707031, 0.6708984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 20.0, 49.0, 90.0, 225.0, 667.0, 3176.0, 38517.0, 849630.0, 147948.0, 6530.0, 1113.0, 343.0, 118.0, 54.0, 26.0, 12.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.31324195861816406, -0.3044624328613281, -0.2956829071044922, -0.28690338134765625, -0.2781238555908203, -0.2693443298339844, -0.26056480407714844, -0.2517852783203125, -0.24300575256347656, -0.23422622680664062, -0.2254467010498047, -0.21666717529296875, -0.2078876495361328, -0.19910812377929688, -0.19032859802246094, -0.181549072265625, -0.17276954650878906, -0.16399002075195312, -0.1552104949951172, -0.14643096923828125, -0.1376514434814453, -0.12887191772460938, -0.12009239196777344, -0.1113128662109375, -0.10253334045410156, -0.09375381469726562, -0.08497428894042969, -0.07619476318359375, -0.06741523742675781, -0.058635711669921875, -0.04985618591308594, -0.04107666015625, -0.03229713439941406, -0.023517608642578125, -0.014738082885742188, -0.00595855712890625, 0.0028209686279296875, 0.011600494384765625, 0.020380020141601562, 0.0291595458984375, 0.03793907165527344, 0.046718597412109375, 0.05549812316894531, 0.06427764892578125, 0.07305717468261719, 0.08183670043945312, 0.09061622619628906, 0.099395751953125, 0.10817527770996094, 0.11695480346679688, 0.1257343292236328, 0.13451385498046875, 0.1432933807373047, 0.15207290649414062, 0.16085243225097656, 0.1696319580078125, 0.17841148376464844, 0.18719100952148438, 0.1959705352783203, 0.20475006103515625, 0.2135295867919922, 0.22230911254882812, 0.23108863830566406, 0.2398681640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 12.0, 10.0, 15.0, 17.0, 21.0, 27.0, 33.0, 54.0, 63.0, 70.0, 101.0, 104.0, 93.0, 75.0, 58.0, 50.0, 36.0, 22.0, 27.0, 25.0, 15.0, 7.0, 16.0, 5.0, 7.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014388561248779297, -0.0001390315592288971, -0.00013417750597000122, -0.00012932345271110535, -0.00012446939945220947, -0.0001196153461933136, -0.00011476129293441772, -0.00010990723967552185, -0.00010505318641662598, -0.0001001991331577301, -9.534507989883423e-05, -9.049102663993835e-05, -8.563697338104248e-05, -8.07829201221466e-05, -7.592886686325073e-05, -7.107481360435486e-05, -6.622076034545898e-05, -6.136670708656311e-05, -5.6512653827667236e-05, -5.165860056877136e-05, -4.680454730987549e-05, -4.1950494050979614e-05, -3.709644079208374e-05, -3.2242387533187866e-05, -2.7388334274291992e-05, -2.2534281015396118e-05, -1.7680227756500244e-05, -1.282617449760437e-05, -7.972121238708496e-06, -3.118067979812622e-06, 1.735985279083252e-06, 6.590038537979126e-06, 1.1444091796875e-05, 1.6298145055770874e-05, 2.1152198314666748e-05, 2.6006251573562622e-05, 3.0860304832458496e-05, 3.571435809135437e-05, 4.0568411350250244e-05, 4.542246460914612e-05, 5.027651786804199e-05, 5.5130571126937866e-05, 5.998462438583374e-05, 6.483867764472961e-05, 6.969273090362549e-05, 7.454678416252136e-05, 7.940083742141724e-05, 8.425489068031311e-05, 8.910894393920898e-05, 9.396299719810486e-05, 9.881705045700073e-05, 0.0001036711037158966, 0.00010852515697479248, 0.00011337921023368835, 0.00011823326349258423, 0.0001230873167514801, 0.00012794137001037598, 0.00013279542326927185, 0.00013764947652816772, 0.0001425035297870636, 0.00014735758304595947, 0.00015221163630485535, 0.00015706568956375122, 0.0001619197428226471, 0.00016677379608154297]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 16.0, 17.0, 49.0, 88.0, 229.0, 715.0, 3580.0, 77920.0, 920452.0, 41801.0, 2787.0, 512.0, 223.0, 76.0, 41.0, 19.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.2819557189941406, -0.27167510986328125, -0.2613945007324219, -0.2511138916015625, -0.24083328247070312, -0.23055267333984375, -0.22027206420898438, -0.209991455078125, -0.19971084594726562, -0.18943023681640625, -0.17914962768554688, -0.1688690185546875, -0.15858840942382812, -0.14830780029296875, -0.13802719116210938, -0.12774658203125, -0.11746597290039062, -0.10718536376953125, -0.09690475463867188, -0.0866241455078125, -0.07634353637695312, -0.06606292724609375, -0.055782318115234375, -0.045501708984375, -0.035221099853515625, -0.02494049072265625, -0.014659881591796875, -0.0043792724609375, 0.005901336669921875, 0.01618194580078125, 0.026462554931640625, 0.0367431640625, 0.047023773193359375, 0.05730438232421875, 0.06758499145507812, 0.0778656005859375, 0.08814620971679688, 0.09842681884765625, 0.10870742797851562, 0.118988037109375, 0.12926864624023438, 0.13954925537109375, 0.14982986450195312, 0.1601104736328125, 0.17039108276367188, 0.18067169189453125, 0.19095230102539062, 0.20123291015625, 0.21151351928710938, 0.22179412841796875, 0.23207473754882812, 0.2423553466796875, 0.2526359558105469, 0.26291656494140625, 0.2731971740722656, 0.283477783203125, 0.2937583923339844, 0.30403900146484375, 0.3143196105957031, 0.3246002197265625, 0.3348808288574219, 0.34516143798828125, 0.3554420471191406, 0.36572265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 4.0, 11.0, 8.0, 18.0, 47.0, 62.0, 130.0, 153.0, 187.0, 138.0, 93.0, 73.0, 36.0, 13.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14160728454589844, -0.13294601440429688, -0.12428474426269531, -0.11562347412109375, -0.10696220397949219, -0.09830093383789062, -0.08963966369628906, -0.0809783935546875, -0.07231712341308594, -0.06365585327148438, -0.05499458312988281, -0.04633331298828125, -0.03767204284667969, -0.029010772705078125, -0.020349502563476562, -0.011688232421875, -0.0030269622802734375, 0.005634307861328125, 0.014295578002929688, 0.02295684814453125, 0.03161811828613281, 0.040279388427734375, 0.04894065856933594, 0.0576019287109375, 0.06626319885253906, 0.07492446899414062, 0.08358573913574219, 0.09224700927734375, 0.10090827941894531, 0.10956954956054688, 0.11823081970214844, 0.12689208984375, 0.13555335998535156, 0.14421463012695312, 0.1528759002685547, 0.16153717041015625, 0.1701984405517578, 0.17885971069335938, 0.18752098083496094, 0.1961822509765625, 0.20484352111816406, 0.21350479125976562, 0.2221660614013672, 0.23082733154296875, 0.2394886016845703, 0.24814987182617188, 0.25681114196777344, 0.265472412109375, 0.27413368225097656, 0.2827949523925781, 0.2914562225341797, 0.30011749267578125, 0.3087787628173828, 0.3174400329589844, 0.32610130310058594, 0.3347625732421875, 0.34342384338378906, 0.3520851135253906, 0.3607463836669922, 0.36940765380859375, 0.3780689239501953, 0.3867301940917969, 0.39539146423339844, 0.404052734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 28.0, 54.0, 112.0, 204.0, 240.0, 179.0, 94.0, 38.0, 13.0, 14.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6615819931030273, -3.5490167140960693, -3.4364516735076904, -3.3238863945007324, -3.2113211154937744, -3.0987558364868164, -2.9861907958984375, -2.8736255168914795, -2.7610602378845215, -2.6484949588775635, -2.5359299182891846, -2.4233646392822266, -2.3107993602752686, -2.1982340812683105, -2.0856690406799316, -1.9731037616729736, -1.8605386018753052, -1.7479734420776367, -1.6354081630706787, -1.5228430032730103, -1.4102777242660522, -1.2977125644683838, -1.1851472854614258, -1.0725821256637573, -0.9600169062614441, -0.8474516868591309, -0.7348864674568176, -0.6223212480545044, -0.5097560882568359, -0.3971908688545227, -0.2846256494522095, -0.17206043004989624, -0.05949521064758301, 0.05307000130414963, 0.16563521325588226, 0.2782004177570343, 0.39076563715934753, 0.5033308267593384, 0.6158960461616516, 0.7284612655639648, 0.8410264849662781, 0.9535917043685913, 1.0661568641662598, 1.1787221431732178, 1.2912873029708862, 1.4038524627685547, 1.5164177417755127, 1.6289830207824707, 1.7415481805801392, 1.8541133403778076, 1.9666786193847656, 2.0792438983917236, 2.1918089389801025, 2.3043742179870605, 2.4169394969940186, 2.5295047760009766, 2.6420698165893555, 2.7546350955963135, 2.8672001361846924, 2.9797654151916504, 3.0923306941986084, 3.2048959732055664, 3.3174610137939453, 3.4300262928009033, 3.5425915718078613]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 7.0, 8.0, 13.0, 13.0, 17.0, 11.0, 19.0, 16.0, 24.0, 27.0, 23.0, 40.0, 38.0, 37.0, 38.0, 44.0, 43.0, 51.0, 42.0, 34.0, 37.0, 49.0, 45.0, 48.0, 36.0, 36.0, 16.0, 26.0, 26.0, 18.0, 20.0, 22.0, 12.0, 13.0, 7.0, 7.0, 7.0, 7.0, 0.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.4537458419799805, -2.3853323459625244, -2.3169188499450684, -2.2485053539276123, -2.1800918579101562, -2.111678123474121, -2.043264627456665, -1.974851131439209, -1.906437635421753, -1.8380241394042969, -1.7696106433868408, -1.7011970281600952, -1.6327835321426392, -1.564370036125183, -1.4959564208984375, -1.4275429248809814, -1.3591294288635254, -1.2907159328460693, -1.2223024368286133, -1.1538888216018677, -1.0854753255844116, -1.0170618295669556, -0.9486482739448547, -0.8802347183227539, -0.8118212223052979, -0.7434077262878418, -0.674994170665741, -0.6065806150436401, -0.5381671190261841, -0.46975359320640564, -0.4013400673866272, -0.33292654156684875, -0.2645127773284912, -0.19609925150871277, -0.12768572568893433, -0.059272199869155884, 0.009141325950622559, 0.077554851770401, 0.14596837759017944, 0.21438190340995789, 0.28279542922973633, 0.35120895504951477, 0.4196224808692932, 0.48803600668907166, 0.5564495325088501, 0.6248630285263062, 0.693276584148407, 0.7616901397705078, 0.8301036357879639, 0.8985171318054199, 0.9669306874275208, 1.0353442430496216, 1.1037577390670776, 1.1721712350845337, 1.2405848503112793, 1.3089983463287354, 1.3774118423461914, 1.4458253383636475, 1.5142388343811035, 1.5826524496078491, 1.6510659456253052, 1.7194794416427612, 1.7878930568695068, 1.856306552886963, 1.924720048904419]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 9.0, 4.0, 13.0, 14.0, 25.0, 45.0, 43.0, 100.0, 134.0, 201.0, 413.0, 1472.0, 39169.0, 4148656.0, 2715.0, 552.0, 290.0, 156.0, 88.0, 58.0, 43.0, 25.0, 16.0, 8.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6708984375, -1.6204986572265625, -1.570098876953125, -1.5196990966796875, -1.46929931640625, -1.4188995361328125, -1.368499755859375, -1.3180999755859375, -1.2677001953125, -1.2173004150390625, -1.166900634765625, -1.1165008544921875, -1.06610107421875, -1.0157012939453125, -0.965301513671875, -0.9149017333984375, -0.864501953125, -0.8141021728515625, -0.763702392578125, -0.7133026123046875, -0.66290283203125, -0.6125030517578125, -0.562103271484375, -0.5117034912109375, -0.4613037109375, -0.4109039306640625, -0.360504150390625, -0.3101043701171875, -0.25970458984375, -0.2093048095703125, -0.158905029296875, -0.1085052490234375, -0.05810546875, -0.0077056884765625, 0.042694091796875, 0.0930938720703125, 0.14349365234375, 0.1938934326171875, 0.244293212890625, 0.2946929931640625, 0.3450927734375, 0.3954925537109375, 0.445892333984375, 0.4962921142578125, 0.54669189453125, 0.5970916748046875, 0.647491455078125, 0.6978912353515625, 0.748291015625, 0.7986907958984375, 0.849090576171875, 0.8994903564453125, 0.94989013671875, 1.0002899169921875, 1.050689697265625, 1.1010894775390625, 1.1514892578125, 1.2018890380859375, 1.252288818359375, 1.3026885986328125, 1.35308837890625, 1.4034881591796875, 1.453887939453125, 1.5042877197265625, 1.5546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 2.0, 5.0, 5.0, 14.0, 16.0, 31.0, 28.0, 34.0, 37.0, 53.0, 68.0, 57.0, 63.0, 79.0, 76.0, 66.0, 72.0, 68.0, 56.0, 44.0, 31.0, 23.0, 15.0, 20.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.221923828125, -0.2158985137939453, -0.20987319946289062, -0.20384788513183594, -0.19782257080078125, -0.19179725646972656, -0.18577194213867188, -0.1797466278076172, -0.1737213134765625, -0.1676959991455078, -0.16167068481445312, -0.15564537048339844, -0.14962005615234375, -0.14359474182128906, -0.13756942749023438, -0.1315441131591797, -0.125518798828125, -0.11949348449707031, -0.11346817016601562, -0.10744285583496094, -0.10141754150390625, -0.09539222717285156, -0.08936691284179688, -0.08334159851074219, -0.0773162841796875, -0.07129096984863281, -0.06526565551757812, -0.05924034118652344, -0.05321502685546875, -0.04718971252441406, -0.041164398193359375, -0.03513908386230469, -0.02911376953125, -0.023088455200195312, -0.017063140869140625, -0.011037826538085938, -0.00501251220703125, 0.0010128021240234375, 0.007038116455078125, 0.013063430786132812, 0.0190887451171875, 0.025114059448242188, 0.031139373779296875, 0.03716468811035156, 0.04319000244140625, 0.04921531677246094, 0.055240631103515625, 0.06126594543457031, 0.067291259765625, 0.07331657409667969, 0.07934188842773438, 0.08536720275878906, 0.09139251708984375, 0.09741783142089844, 0.10344314575195312, 0.10946846008300781, 0.1154937744140625, 0.12151908874511719, 0.12754440307617188, 0.13356971740722656, 0.13959503173828125, 0.14562034606933594, 0.15164566040039062, 0.1576709747314453, 0.1636962890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 9.0, 5.0, 18.0, 22.0, 28.0, 39.0, 48.0, 80.0, 79.0, 115.0, 168.0, 248.0, 322.0, 526.0, 852.0, 1684.0, 3561.0, 9771.0, 52785.0, 4059514.0, 47402.0, 9372.0, 3562.0, 1592.0, 877.0, 495.0, 341.0, 231.0, 149.0, 124.0, 85.0, 44.0, 45.0, 19.0, 20.0, 12.0, 8.0, 10.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3459434509277344, -0.33495330810546875, -0.3239631652832031, -0.3129730224609375, -0.3019828796386719, -0.29099273681640625, -0.2800025939941406, -0.269012451171875, -0.2580223083496094, -0.24703216552734375, -0.23604202270507812, -0.2250518798828125, -0.21406173706054688, -0.20307159423828125, -0.19208145141601562, -0.18109130859375, -0.17010116577148438, -0.15911102294921875, -0.14812088012695312, -0.1371307373046875, -0.12614059448242188, -0.11515045166015625, -0.10416030883789062, -0.093170166015625, -0.08218002319335938, -0.07118988037109375, -0.060199737548828125, -0.0492095947265625, -0.038219451904296875, -0.02722930908203125, -0.016239166259765625, -0.0052490234375, 0.005741119384765625, 0.01673126220703125, 0.027721405029296875, 0.0387115478515625, 0.049701690673828125, 0.06069183349609375, 0.07168197631835938, 0.082672119140625, 0.09366226196289062, 0.10465240478515625, 0.11564254760742188, 0.1266326904296875, 0.13762283325195312, 0.14861297607421875, 0.15960311889648438, 0.17059326171875, 0.18158340454101562, 0.19257354736328125, 0.20356369018554688, 0.2145538330078125, 0.22554397583007812, 0.23653411865234375, 0.24752426147460938, 0.258514404296875, 0.2695045471191406, 0.28049468994140625, 0.2914848327636719, 0.3024749755859375, 0.3134651184082031, 0.32445526123046875, 0.3354454040527344, 0.346435546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 14.0, 23.0, 120.0, 3665.0, 164.0, 33.0, 18.0, 11.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15996646881103516, -0.1561145782470703, -0.15226268768310547, -0.14841079711914062, -0.14455890655517578, -0.14070701599121094, -0.1368551254272461, -0.13300323486328125, -0.1291513442993164, -0.12529945373535156, -0.12144756317138672, -0.11759567260742188, -0.11374378204345703, -0.10989189147949219, -0.10604000091552734, -0.1021881103515625, -0.09833621978759766, -0.09448432922363281, -0.09063243865966797, -0.08678054809570312, -0.08292865753173828, -0.07907676696777344, -0.0752248764038086, -0.07137298583984375, -0.0675210952758789, -0.06366920471191406, -0.05981731414794922, -0.055965423583984375, -0.05211353302001953, -0.04826164245605469, -0.044409751892089844, -0.040557861328125, -0.036705970764160156, -0.03285408020019531, -0.02900218963623047, -0.025150299072265625, -0.02129840850830078, -0.017446517944335938, -0.013594627380371094, -0.00974273681640625, -0.005890846252441406, -0.0020389556884765625, 0.0018129348754882812, 0.005664825439453125, 0.009516716003417969, 0.013368606567382812, 0.017220497131347656, 0.0210723876953125, 0.024924278259277344, 0.028776168823242188, 0.03262805938720703, 0.036479949951171875, 0.04033184051513672, 0.04418373107910156, 0.048035621643066406, 0.05188751220703125, 0.055739402770996094, 0.05959129333496094, 0.06344318389892578, 0.06729507446289062, 0.07114696502685547, 0.07499885559082031, 0.07885074615478516, 0.08270263671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 13.0, 21.0, 61.0, 105.0, 168.0, 239.0, 186.0, 102.0, 61.0, 21.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35893046855926514, -0.3456893265247345, -0.33244821429252625, -0.3192070722579956, -0.30596593022346497, -0.2927247881889343, -0.2794836759567261, -0.26624253392219543, -0.2530013918876648, -0.23976026475429535, -0.2265191227197647, -0.21327799558639526, -0.20003685355186462, -0.18679572641849518, -0.17355459928512573, -0.1603134572505951, -0.14707234501838684, -0.1338312178850174, -0.12059007585048676, -0.10734894871711731, -0.09410781413316727, -0.08086667954921722, -0.06762555241584778, -0.054384417831897736, -0.04114328324794769, -0.0279021505266428, -0.014661017805337906, -0.0014198869466781616, 0.011821247637271881, 0.025062382221221924, 0.03830350935459137, 0.05154464393854141, 0.06478574872016907, 0.07802688330411911, 0.09126801788806915, 0.1045091450214386, 0.11775027960538864, 0.13099141418933868, 0.14423254132270813, 0.15747368335723877, 0.17071481049060822, 0.18395593762397766, 0.1971970796585083, 0.21043820679187775, 0.2236793339252472, 0.23692047595977783, 0.2501615881919861, 0.2634027302265167, 0.27664387226104736, 0.289885014295578, 0.30312612652778625, 0.3163672685623169, 0.32960841059684753, 0.3428495526313782, 0.3560906648635864, 0.36933180689811707, 0.3825729489326477, 0.39581409096717834, 0.4090552031993866, 0.42229634523391724, 0.4355374872684479, 0.4487786293029785, 0.46201974153518677, 0.4752608835697174, 0.48850199580192566]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 8.0, 10.0, 8.0, 8.0, 25.0, 20.0, 16.0, 14.0, 28.0, 28.0, 33.0, 41.0, 29.0, 28.0, 34.0, 36.0, 43.0, 47.0, 35.0, 48.0, 49.0, 30.0, 32.0, 35.0, 33.0, 31.0, 35.0, 31.0, 32.0, 23.0, 21.0, 17.0, 15.0, 8.0, 7.0, 9.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15804731845855713, -0.15313029289245605, -0.1482132524251938, -0.1432962268590927, -0.13837918639183044, -0.13346216082572937, -0.1285451203584671, -0.12362809479236603, -0.11871106177568436, -0.11379402875900269, -0.10887699574232101, -0.10395996272563934, -0.09904293715953827, -0.094125896692276, -0.08920887112617493, -0.08429183810949326, -0.07937480509281158, -0.07445777207612991, -0.06954073905944824, -0.06462370604276657, -0.0597066767513752, -0.05478964373469353, -0.049872614443302155, -0.04495558142662048, -0.04003854840993881, -0.03512151539325714, -0.03020448423922062, -0.025287453085184097, -0.020370420068502426, -0.015453387051820755, -0.010536355897784233, -0.005619324743747711, -0.00070229172706604, 0.0042147403582930565, 0.009131772443652153, 0.01404880452901125, 0.018965836614370346, 0.023882869631052017, 0.02879990078508854, 0.03371693193912506, 0.03863396495580673, 0.0435509979724884, 0.048468030989170074, 0.05338506028056145, 0.05830209329724312, 0.06321913003921509, 0.06813615560531616, 0.07305318862199783, 0.0779702216386795, 0.08288725465536118, 0.08780428767204285, 0.09272132068872452, 0.09763835370540619, 0.10255537927150726, 0.10747241228818893, 0.1123894453048706, 0.11730647832155228, 0.12222351133823395, 0.12714053690433502, 0.1320575773715973, 0.13697460293769836, 0.14189164340496063, 0.1468086689710617, 0.15172570943832397, 0.15664273500442505]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 8.0, 9.0, 14.0, 20.0, 32.0, 42.0, 63.0, 97.0, 123.0, 184.0, 265.0, 400.0, 608.0, 1187.0, 2294.0, 5076.0, 12257.0, 35721.0, 121031.0, 371742.0, 340346.0, 104746.0, 31591.0, 11169.0, 4576.0, 2085.0, 1105.0, 594.0, 370.0, 224.0, 172.0, 115.0, 89.0, 53.0, 38.0, 32.0, 13.0, 18.0, 15.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29784393310546875, -0.2888031005859375, -0.27976226806640625, -0.270721435546875, -0.26168060302734375, -0.2526397705078125, -0.24359893798828125, -0.23455810546875, -0.22551727294921875, -0.2164764404296875, -0.20743560791015625, -0.198394775390625, -0.18935394287109375, -0.1803131103515625, -0.17127227783203125, -0.1622314453125, -0.15319061279296875, -0.1441497802734375, -0.13510894775390625, -0.126068115234375, -0.11702728271484375, -0.1079864501953125, -0.09894561767578125, -0.08990478515625, -0.08086395263671875, -0.0718231201171875, -0.06278228759765625, -0.053741455078125, -0.04470062255859375, -0.0356597900390625, -0.02661895751953125, -0.017578125, -0.00853729248046875, 0.0005035400390625, 0.00954437255859375, 0.018585205078125, 0.02762603759765625, 0.0366668701171875, 0.04570770263671875, 0.05474853515625, 0.06378936767578125, 0.0728302001953125, 0.08187103271484375, 0.090911865234375, 0.09995269775390625, 0.1089935302734375, 0.11803436279296875, 0.1270751953125, 0.13611602783203125, 0.1451568603515625, 0.15419769287109375, 0.163238525390625, 0.17227935791015625, 0.1813201904296875, 0.19036102294921875, 0.19940185546875, 0.20844268798828125, 0.2174835205078125, 0.22652435302734375, 0.235565185546875, 0.24460601806640625, 0.2536468505859375, 0.26268768310546875, 0.271728515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 13.0, 6.0, 28.0, 21.0, 24.0, 26.0, 35.0, 43.0, 50.0, 68.0, 69.0, 65.0, 60.0, 65.0, 73.0, 66.0, 67.0, 46.0, 41.0, 33.0, 24.0, 23.0, 13.0, 8.0, 13.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2242431640625, -0.2181072235107422, -0.21197128295898438, -0.20583534240722656, -0.19969940185546875, -0.19356346130371094, -0.18742752075195312, -0.1812915802001953, -0.1751556396484375, -0.1690196990966797, -0.16288375854492188, -0.15674781799316406, -0.15061187744140625, -0.14447593688964844, -0.13833999633789062, -0.1322040557861328, -0.126068115234375, -0.11993217468261719, -0.11379623413085938, -0.10766029357910156, -0.10152435302734375, -0.09538841247558594, -0.08925247192382812, -0.08311653137207031, -0.0769805908203125, -0.07084465026855469, -0.06470870971679688, -0.05857276916503906, -0.05243682861328125, -0.04630088806152344, -0.040164947509765625, -0.03402900695800781, -0.02789306640625, -0.021757125854492188, -0.015621185302734375, -0.009485244750976562, -0.00334930419921875, 0.0027866363525390625, 0.008922576904296875, 0.015058517456054688, 0.0211944580078125, 0.027330398559570312, 0.033466339111328125, 0.03960227966308594, 0.04573822021484375, 0.05187416076660156, 0.058010101318359375, 0.06414604187011719, 0.070281982421875, 0.07641792297363281, 0.08255386352539062, 0.08868980407714844, 0.09482574462890625, 0.10096168518066406, 0.10709762573242188, 0.11323356628417969, 0.1193695068359375, 0.1255054473876953, 0.13164138793945312, 0.13777732849121094, 0.14391326904296875, 0.15004920959472656, 0.15618515014648438, 0.1623210906982422, 0.16845703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 6.0, 4.0, 9.0, 14.0, 21.0, 29.0, 33.0, 61.0, 74.0, 121.0, 224.0, 326.0, 565.0, 1117.0, 2897.0, 10526.0, 59533.0, 459226.0, 440968.0, 57024.0, 10346.0, 2898.0, 1118.0, 558.0, 330.0, 190.0, 131.0, 65.0, 54.0, 36.0, 23.0, 14.0, 6.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.3516883850097656, -0.34033966064453125, -0.3289909362792969, -0.3176422119140625, -0.3062934875488281, -0.29494476318359375, -0.2835960388183594, -0.272247314453125, -0.2608985900878906, -0.24954986572265625, -0.23820114135742188, -0.2268524169921875, -0.21550369262695312, -0.20415496826171875, -0.19280624389648438, -0.18145751953125, -0.17010879516601562, -0.15876007080078125, -0.14741134643554688, -0.1360626220703125, -0.12471389770507812, -0.11336517333984375, -0.10201644897460938, -0.090667724609375, -0.07931900024414062, -0.06797027587890625, -0.056621551513671875, -0.0452728271484375, -0.033924102783203125, -0.02257537841796875, -0.011226654052734375, 0.0001220703125, 0.011470794677734375, 0.02281951904296875, 0.034168243408203125, 0.0455169677734375, 0.056865692138671875, 0.06821441650390625, 0.07956314086914062, 0.090911865234375, 0.10226058959960938, 0.11360931396484375, 0.12495803833007812, 0.1363067626953125, 0.14765548706054688, 0.15900421142578125, 0.17035293579101562, 0.18170166015625, 0.19305038452148438, 0.20439910888671875, 0.21574783325195312, 0.2270965576171875, 0.23844528198242188, 0.24979400634765625, 0.2611427307128906, 0.272491455078125, 0.2838401794433594, 0.29518890380859375, 0.3065376281738281, 0.3178863525390625, 0.3292350769042969, 0.34058380126953125, 0.3519325256347656, 0.36328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 11.0, 5.0, 10.0, 9.0, 8.0, 14.0, 17.0, 23.0, 27.0, 27.0, 32.0, 50.0, 40.0, 48.0, 61.0, 39.0, 41.0, 65.0, 50.0, 41.0, 50.0, 43.0, 39.0, 44.0, 37.0, 30.0, 33.0, 27.0, 21.0, 17.0, 7.0, 13.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69970703125, -0.67938232421875, -0.6590576171875, -0.63873291015625, -0.618408203125, -0.59808349609375, -0.5777587890625, -0.55743408203125, -0.537109375, -0.51678466796875, -0.4964599609375, -0.47613525390625, -0.455810546875, -0.43548583984375, -0.4151611328125, -0.39483642578125, -0.37451171875, -0.35418701171875, -0.3338623046875, -0.31353759765625, -0.293212890625, -0.27288818359375, -0.2525634765625, -0.23223876953125, -0.2119140625, -0.19158935546875, -0.1712646484375, -0.15093994140625, -0.130615234375, -0.11029052734375, -0.0899658203125, -0.06964111328125, -0.04931640625, -0.02899169921875, -0.0086669921875, 0.01165771484375, 0.031982421875, 0.05230712890625, 0.0726318359375, 0.09295654296875, 0.11328125, 0.13360595703125, 0.1539306640625, 0.17425537109375, 0.194580078125, 0.21490478515625, 0.2352294921875, 0.25555419921875, 0.27587890625, 0.29620361328125, 0.3165283203125, 0.33685302734375, 0.357177734375, 0.37750244140625, 0.3978271484375, 0.41815185546875, 0.4384765625, 0.45880126953125, 0.4791259765625, 0.49945068359375, 0.519775390625, 0.54010009765625, 0.5604248046875, 0.58074951171875, 0.60107421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 16.0, 31.0, 54.0, 120.0, 209.0, 651.0, 1980.0, 8954.0, 115927.0, 850253.0, 61387.0, 6341.0, 1576.0, 576.0, 236.0, 110.0, 51.0, 24.0, 13.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.2357196807861328, -0.22742080688476562, -0.21912193298339844, -0.21082305908203125, -0.20252418518066406, -0.19422531127929688, -0.1859264373779297, -0.1776275634765625, -0.1693286895751953, -0.16102981567382812, -0.15273094177246094, -0.14443206787109375, -0.13613319396972656, -0.12783432006835938, -0.11953544616699219, -0.111236572265625, -0.10293769836425781, -0.09463882446289062, -0.08633995056152344, -0.07804107666015625, -0.06974220275878906, -0.061443328857421875, -0.05314445495605469, -0.0448455810546875, -0.03654670715332031, -0.028247833251953125, -0.019948959350585938, -0.01165008544921875, -0.0033512115478515625, 0.004947662353515625, 0.013246536254882812, 0.02154541015625, 0.029844284057617188, 0.038143157958984375, 0.04644203186035156, 0.05474090576171875, 0.06303977966308594, 0.07133865356445312, 0.07963752746582031, 0.0879364013671875, 0.09623527526855469, 0.10453414916992188, 0.11283302307128906, 0.12113189697265625, 0.12943077087402344, 0.13772964477539062, 0.1460285186767578, 0.154327392578125, 0.1626262664794922, 0.17092514038085938, 0.17922401428222656, 0.18752288818359375, 0.19582176208496094, 0.20412063598632812, 0.2124195098876953, 0.2207183837890625, 0.2290172576904297, 0.23731613159179688, 0.24561500549316406, 0.25391387939453125, 0.26221275329589844, 0.2705116271972656, 0.2788105010986328, 0.287109375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 3.0, 4.0, 5.0, 7.0, 17.0, 11.0, 11.0, 16.0, 23.0, 32.0, 38.0, 47.0, 66.0, 73.0, 85.0, 108.0, 88.0, 61.0, 65.0, 53.0, 48.0, 35.0, 13.0, 12.0, 14.0, 18.0, 6.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.554624557495117e-05, -9.220093488693237e-05, -8.885562419891357e-05, -8.551031351089478e-05, -8.216500282287598e-05, -7.881969213485718e-05, -7.547438144683838e-05, -7.212907075881958e-05, -6.878376007080078e-05, -6.543844938278198e-05, -6.209313869476318e-05, -5.8747828006744385e-05, -5.5402517318725586e-05, -5.205720663070679e-05, -4.871189594268799e-05, -4.536658525466919e-05, -4.202127456665039e-05, -3.867596387863159e-05, -3.533065319061279e-05, -3.1985342502593994e-05, -2.8640031814575195e-05, -2.5294721126556396e-05, -2.1949410438537598e-05, -1.86040997505188e-05, -1.52587890625e-05, -1.1913478374481201e-05, -8.568167686462402e-06, -5.2228569984436035e-06, -1.8775463104248047e-06, 1.4677643775939941e-06, 4.813075065612793e-06, 8.158385753631592e-06, 1.150369644165039e-05, 1.484900712966919e-05, 1.8194317817687988e-05, 2.1539628505706787e-05, 2.4884939193725586e-05, 2.8230249881744385e-05, 3.1575560569763184e-05, 3.492087125778198e-05, 3.826618194580078e-05, 4.161149263381958e-05, 4.495680332183838e-05, 4.830211400985718e-05, 5.1647424697875977e-05, 5.4992735385894775e-05, 5.8338046073913574e-05, 6.168335676193237e-05, 6.502866744995117e-05, 6.837397813796997e-05, 7.171928882598877e-05, 7.506459951400757e-05, 7.840991020202637e-05, 8.175522089004517e-05, 8.510053157806396e-05, 8.844584226608276e-05, 9.179115295410156e-05, 9.513646364212036e-05, 9.848177433013916e-05, 0.00010182708501815796, 0.00010517239570617676, 0.00010851770639419556, 0.00011186301708221436, 0.00011520832777023315, 0.00011855363845825195]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 11.0, 11.0, 18.0, 16.0, 30.0, 64.0, 78.0, 168.0, 333.0, 690.0, 1480.0, 4217.0, 16725.0, 162014.0, 745978.0, 98455.0, 12289.0, 3427.0, 1312.0, 516.0, 283.0, 159.0, 94.0, 51.0, 38.0, 29.0, 17.0, 11.0, 9.0, 4.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.177978515625, -0.17192649841308594, -0.16587448120117188, -0.1598224639892578, -0.15377044677734375, -0.1477184295654297, -0.14166641235351562, -0.13561439514160156, -0.1295623779296875, -0.12351036071777344, -0.11745834350585938, -0.11140632629394531, -0.10535430908203125, -0.09930229187011719, -0.09325027465820312, -0.08719825744628906, -0.081146240234375, -0.07509422302246094, -0.06904220581054688, -0.06299018859863281, -0.05693817138671875, -0.05088615417480469, -0.044834136962890625, -0.03878211975097656, -0.0327301025390625, -0.026678085327148438, -0.020626068115234375, -0.014574050903320312, -0.00852203369140625, -0.0024700164794921875, 0.003582000732421875, 0.009634017944335938, 0.01568603515625, 0.021738052368164062, 0.027790069580078125, 0.03384208679199219, 0.03989410400390625, 0.04594612121582031, 0.051998138427734375, 0.05805015563964844, 0.0641021728515625, 0.07015419006347656, 0.07620620727539062, 0.08225822448730469, 0.08831024169921875, 0.09436225891113281, 0.10041427612304688, 0.10646629333496094, 0.112518310546875, 0.11857032775878906, 0.12462234497070312, 0.1306743621826172, 0.13672637939453125, 0.1427783966064453, 0.14883041381835938, 0.15488243103027344, 0.1609344482421875, 0.16698646545410156, 0.17303848266601562, 0.1790904998779297, 0.18514251708984375, 0.1911945343017578, 0.19724655151367188, 0.20329856872558594, 0.2093505859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 15.0, 29.0, 41.0, 89.0, 121.0, 170.0, 171.0, 155.0, 89.0, 50.0, 21.0, 16.0, 4.0, 7.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19970703125, -0.18926239013671875, -0.1788177490234375, -0.16837310791015625, -0.157928466796875, -0.14748382568359375, -0.1370391845703125, -0.12659454345703125, -0.11614990234375, -0.10570526123046875, -0.0952606201171875, -0.08481597900390625, -0.074371337890625, -0.06392669677734375, -0.0534820556640625, -0.04303741455078125, -0.0325927734375, -0.02214813232421875, -0.0117034912109375, -0.00125885009765625, 0.009185791015625, 0.01963043212890625, 0.0300750732421875, 0.04051971435546875, 0.05096435546875, 0.06140899658203125, 0.0718536376953125, 0.08229827880859375, 0.092742919921875, 0.10318756103515625, 0.1136322021484375, 0.12407684326171875, 0.134521484375, 0.14496612548828125, 0.1554107666015625, 0.16585540771484375, 0.176300048828125, 0.18674468994140625, 0.1971893310546875, 0.20763397216796875, 0.21807861328125, 0.22852325439453125, 0.2389678955078125, 0.24941253662109375, 0.259857177734375, 0.27030181884765625, 0.2807464599609375, 0.29119110107421875, 0.3016357421875, 0.31208038330078125, 0.3225250244140625, 0.33296966552734375, 0.343414306640625, 0.35385894775390625, 0.3643035888671875, 0.37474822998046875, 0.38519287109375, 0.39563751220703125, 0.4060821533203125, 0.41652679443359375, 0.426971435546875, 0.43741607666015625, 0.4478607177734375, 0.45830535888671875, 0.46875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 13.0, 20.0, 15.0, 27.0, 42.0, 60.0, 98.0, 138.0, 164.0, 150.0, 116.0, 63.0, 43.0, 19.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9455392360687256, -1.8637481927871704, -1.7819571495056152, -1.7001662254333496, -1.6183751821517944, -1.5365841388702393, -1.4547932147979736, -1.3730021715164185, -1.2912111282348633, -1.209420084953308, -1.127629041671753, -1.0458381175994873, -0.9640470743179321, -0.882256031036377, -0.8004650473594666, -0.7186740636825562, -0.636883020401001, -0.5550919771194458, -0.4733009934425354, -0.3915099799633026, -0.3097189664840698, -0.22792795300483704, -0.14613693952560425, -0.06434595584869385, 0.017445087432861328, 0.09923610091209412, 0.1810271143913269, 0.2628181278705597, 0.3446091413497925, 0.42640015482902527, 0.5081911683082581, 0.5899821519851685, 0.6717734336853027, 0.7535644769668579, 0.8353554606437683, 0.9171464443206787, 0.9989374876022339, 1.080728530883789, 1.1625194549560547, 1.2443104982376099, 1.326101541519165, 1.4078925848007202, 1.4896836280822754, 1.571474552154541, 1.6532655954360962, 1.7350566387176514, 1.816847562789917, 1.8986386060714722, 1.9804296493530273, 2.062220573425293, 2.1440117359161377, 2.2258026599884033, 2.307593822479248, 2.3893847465515137, 2.4711756706237793, 2.552966594696045, 2.6347577571868896, 2.7165486812591553, 2.79833984375, 2.8801307678222656, 2.9619216918945312, 3.043712854385376, 3.1255037784576416, 3.2072949409484863, 3.289085865020752]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 11.0, 2.0, 9.0, 4.0, 13.0, 9.0, 9.0, 16.0, 19.0, 27.0, 27.0, 25.0, 26.0, 42.0, 37.0, 34.0, 53.0, 50.0, 48.0, 52.0, 66.0, 43.0, 33.0, 27.0, 35.0, 31.0, 34.0, 26.0, 28.0, 29.0, 17.0, 18.0, 11.0, 15.0, 16.0, 11.0, 11.0, 5.0, 4.0, 8.0, 10.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.0298027992248535, -2.9452853202819824, -2.8607680797576904, -2.7762506008148193, -2.6917331218719482, -2.607215642929077, -2.522698402404785, -2.438180923461914, -2.353663444519043, -2.269145965576172, -2.18462872505188, -2.100111246109009, -2.0155937671661377, -1.9310764074325562, -1.8465590476989746, -1.7620415687561035, -1.677524209022522, -1.5930068492889404, -1.5084893703460693, -1.4239720106124878, -1.3394545316696167, -1.2549371719360352, -1.170419692993164, -1.0859023332595825, -1.001384973526001, -0.9168675541877747, -0.8323501348495483, -0.7478327751159668, -0.6633152961730957, -0.5787979364395142, -0.49428051710128784, -0.4097630977630615, -0.32524561882019043, -0.2407281994819641, -0.156210795044899, -0.07169339060783386, 0.012824028730392456, 0.09734144806861877, 0.1818588376045227, 0.266376256942749, 0.35089367628097534, 0.43541109561920166, 0.519928514957428, 0.6044459342956543, 0.6889632940292358, 0.7734807729721069, 0.8579981327056885, 0.9425155520439148, 1.0270329713821411, 1.1115503311157227, 1.1960678100585938, 1.2805851697921753, 1.3651026487350464, 1.449620008468628, 1.534137487411499, 1.6186548471450806, 1.703172206878662, 1.7876895666122437, 1.8722070455551147, 1.9567244052886963, 2.0412418842315674, 2.1257593631744385, 2.2102766036987305, 2.2947940826416016, 2.3793115615844727]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 9.0, 15.0, 16.0, 30.0, 46.0, 95.0, 160.0, 292.0, 633.0, 1792.0, 7861.0, 4082732.0, 93825.0, 4436.0, 1244.0, 515.0, 242.0, 132.0, 64.0, 42.0, 23.0, 16.0, 14.0, 11.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67578125, -0.6474456787109375, -0.619110107421875, -0.5907745361328125, -0.56243896484375, -0.5341033935546875, -0.505767822265625, -0.4774322509765625, -0.4490966796875, -0.4207611083984375, -0.392425537109375, -0.3640899658203125, -0.33575439453125, -0.3074188232421875, -0.279083251953125, -0.2507476806640625, -0.222412109375, -0.1940765380859375, -0.165740966796875, -0.1374053955078125, -0.10906982421875, -0.0807342529296875, -0.052398681640625, -0.0240631103515625, 0.0042724609375, 0.0326080322265625, 0.060943603515625, 0.0892791748046875, 0.11761474609375, 0.1459503173828125, 0.174285888671875, 0.2026214599609375, 0.23095703125, 0.2592926025390625, 0.287628173828125, 0.3159637451171875, 0.34429931640625, 0.3726348876953125, 0.400970458984375, 0.4293060302734375, 0.4576416015625, 0.4859771728515625, 0.514312744140625, 0.5426483154296875, 0.57098388671875, 0.5993194580078125, 0.627655029296875, 0.6559906005859375, 0.684326171875, 0.7126617431640625, 0.740997314453125, 0.7693328857421875, 0.79766845703125, 0.8260040283203125, 0.854339599609375, 0.8826751708984375, 0.9110107421875, 0.9393463134765625, 0.967681884765625, 0.9960174560546875, 1.02435302734375, 1.0526885986328125, 1.081024169921875, 1.1093597412109375, 1.1376953125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 10.0, 12.0, 18.0, 16.0, 31.0, 30.0, 33.0, 30.0, 58.0, 58.0, 58.0, 64.0, 49.0, 71.0, 61.0, 68.0, 52.0, 45.0, 44.0, 28.0, 23.0, 25.0, 25.0, 20.0, 10.0, 16.0, 11.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2269287109375, -0.2207965850830078, -0.21466445922851562, -0.20853233337402344, -0.20240020751953125, -0.19626808166503906, -0.19013595581054688, -0.1840038299560547, -0.1778717041015625, -0.1717395782470703, -0.16560745239257812, -0.15947532653808594, -0.15334320068359375, -0.14721107482910156, -0.14107894897460938, -0.1349468231201172, -0.128814697265625, -0.12268257141113281, -0.11655044555664062, -0.11041831970214844, -0.10428619384765625, -0.09815406799316406, -0.09202194213867188, -0.08588981628417969, -0.0797576904296875, -0.07362556457519531, -0.06749343872070312, -0.06136131286621094, -0.05522918701171875, -0.04909706115722656, -0.042964935302734375, -0.03683280944824219, -0.03070068359375, -0.024568557739257812, -0.018436431884765625, -0.012304306030273438, -0.00617218017578125, -4.00543212890625e-05, 0.006092071533203125, 0.012224197387695312, 0.0183563232421875, 0.024488449096679688, 0.030620574951171875, 0.03675270080566406, 0.04288482666015625, 0.04901695251464844, 0.055149078369140625, 0.06128120422363281, 0.067413330078125, 0.07354545593261719, 0.07967758178710938, 0.08580970764160156, 0.09194183349609375, 0.09807395935058594, 0.10420608520507812, 0.11033821105957031, 0.1164703369140625, 0.12260246276855469, 0.12873458862304688, 0.13486671447753906, 0.14099884033203125, 0.14713096618652344, 0.15326309204101562, 0.1593952178955078, 0.16552734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 7.0, 1.0, 5.0, 4.0, 11.0, 13.0, 18.0, 22.0, 24.0, 31.0, 38.0, 54.0, 99.0, 148.0, 239.0, 399.0, 724.0, 1280.0, 2787.0, 7816.0, 50247.0, 4061356.0, 54675.0, 8155.0, 2907.0, 1311.0, 702.0, 389.0, 265.0, 143.0, 100.0, 76.0, 58.0, 41.0, 26.0, 27.0, 19.0, 16.0, 8.0, 7.0, 5.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.429931640625, -0.416290283203125, -0.40264892578125, -0.389007568359375, -0.3753662109375, -0.361724853515625, -0.34808349609375, -0.334442138671875, -0.32080078125, -0.307159423828125, -0.29351806640625, -0.279876708984375, -0.2662353515625, -0.252593994140625, -0.23895263671875, -0.225311279296875, -0.211669921875, -0.198028564453125, -0.18438720703125, -0.170745849609375, -0.1571044921875, -0.143463134765625, -0.12982177734375, -0.116180419921875, -0.1025390625, -0.088897705078125, -0.07525634765625, -0.061614990234375, -0.0479736328125, -0.034332275390625, -0.02069091796875, -0.007049560546875, 0.006591796875, 0.020233154296875, 0.03387451171875, 0.047515869140625, 0.0611572265625, 0.074798583984375, 0.08843994140625, 0.102081298828125, 0.11572265625, 0.129364013671875, 0.14300537109375, 0.156646728515625, 0.1702880859375, 0.183929443359375, 0.19757080078125, 0.211212158203125, 0.224853515625, 0.238494873046875, 0.25213623046875, 0.265777587890625, 0.2794189453125, 0.293060302734375, 0.30670166015625, 0.320343017578125, 0.333984375, 0.347625732421875, 0.36126708984375, 0.374908447265625, 0.3885498046875, 0.402191162109375, 0.41583251953125, 0.429473876953125, 0.443115234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 2.0, 14.0, 25.0, 80.0, 3577.0, 289.0, 49.0, 26.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.26122188568115234, -0.2551097869873047, -0.24899768829345703, -0.24288558959960938, -0.23677349090576172, -0.23066139221191406, -0.2245492935180664, -0.21843719482421875, -0.2123250961303711, -0.20621299743652344, -0.20010089874267578, -0.19398880004882812, -0.18787670135498047, -0.1817646026611328, -0.17565250396728516, -0.1695404052734375, -0.16342830657958984, -0.1573162078857422, -0.15120410919189453, -0.14509201049804688, -0.13897991180419922, -0.13286781311035156, -0.1267557144165039, -0.12064361572265625, -0.1145315170288086, -0.10841941833496094, -0.10230731964111328, -0.09619522094726562, -0.09008312225341797, -0.08397102355957031, -0.07785892486572266, -0.071746826171875, -0.06563472747802734, -0.05952262878417969, -0.05341053009033203, -0.047298431396484375, -0.04118633270263672, -0.03507423400878906, -0.028962135314941406, -0.02285003662109375, -0.016737937927246094, -0.010625839233398438, -0.004513740539550781, 0.001598358154296875, 0.007710456848144531, 0.013822555541992188, 0.019934654235839844, 0.0260467529296875, 0.032158851623535156, 0.03827095031738281, 0.04438304901123047, 0.050495147705078125, 0.05660724639892578, 0.06271934509277344, 0.0688314437866211, 0.07494354248046875, 0.0810556411743164, 0.08716773986816406, 0.09327983856201172, 0.09939193725585938, 0.10550403594970703, 0.11161613464355469, 0.11772823333740234, 0.12384033203125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 20.0, 48.0, 71.0, 124.0, 163.0, 176.0, 147.0, 109.0, 65.0, 34.0, 15.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5215672254562378, -0.508392333984375, -0.495217502117157, -0.4820426106452942, -0.4688677489757538, -0.4556928873062134, -0.4425179958343506, -0.4293431341648102, -0.4161682724952698, -0.40299341082572937, -0.38981854915618896, -0.37664365768432617, -0.36346879601478577, -0.35029393434524536, -0.33711904287338257, -0.32394418120384216, -0.31076931953430176, -0.29759445786476135, -0.28441959619522095, -0.27124470472335815, -0.25806984305381775, -0.24489498138427734, -0.23172010481357574, -0.21854522824287415, -0.20537036657333374, -0.19219550490379333, -0.17902062833309174, -0.16584575176239014, -0.15267089009284973, -0.13949602842330933, -0.12632115185260773, -0.11314628273248672, -0.09997141361236572, -0.08679654449224472, -0.07362167537212372, -0.060446806252002716, -0.047271937131881714, -0.03409706801176071, -0.02092219889163971, -0.007747329771518707, 0.005427539348602295, 0.018602408468723297, 0.0317772775888443, 0.0449521467089653, 0.058127015829086304, 0.0713018849492073, 0.08447675406932831, 0.09765162318944931, 0.11082649230957031, 0.12400136142969131, 0.13717623054981232, 0.15035110712051392, 0.16352596879005432, 0.17670083045959473, 0.18987570703029633, 0.20305058360099792, 0.21622544527053833, 0.22940030694007874, 0.24257518351078033, 0.25575006008148193, 0.26892492175102234, 0.28209978342056274, 0.29527467489242554, 0.30844953656196594, 0.32162439823150635]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 6.0, 11.0, 10.0, 16.0, 12.0, 26.0, 18.0, 21.0, 24.0, 23.0, 37.0, 41.0, 43.0, 43.0, 42.0, 40.0, 52.0, 46.0, 51.0, 49.0, 50.0, 42.0, 38.0, 45.0, 30.0, 28.0, 30.0, 28.0, 16.0, 19.0, 12.0, 12.0, 9.0, 5.0, 1.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22378134727478027, -0.21661347150802612, -0.20944559574127197, -0.20227771997451782, -0.19510984420776367, -0.18794196844100952, -0.18077409267425537, -0.17360621690750122, -0.16643834114074707, -0.15927046537399292, -0.15210258960723877, -0.14493471384048462, -0.13776683807373047, -0.13059896230697632, -0.12343109399080276, -0.11626321822404861, -0.10909534990787506, -0.10192747414112091, -0.09475959837436676, -0.08759172260761261, -0.08042384684085846, -0.07325597107410431, -0.06608810275793076, -0.058920226991176605, -0.051752351224422455, -0.044584475457668304, -0.037416599690914154, -0.030248727649450302, -0.02308085188269615, -0.015912976115942, -0.00874510407447815, -0.001577228307723999, 0.005590647459030151, 0.012758522294461727, 0.019926397129893303, 0.027094271034002304, 0.034262146800756454, 0.041430022567510605, 0.04859789460897446, 0.05576577037572861, 0.06293364614248276, 0.07010152190923691, 0.07726939767599106, 0.08443726599216461, 0.09160514175891876, 0.09877301752567291, 0.10594089329242706, 0.11310876905918121, 0.12027664482593536, 0.12744452059268951, 0.13461239635944366, 0.14178027212619781, 0.14894814789295197, 0.15611602365970612, 0.16328388452529907, 0.17045176029205322, 0.17761963605880737, 0.18478751182556152, 0.19195538759231567, 0.19912326335906982, 0.20629113912582397, 0.21345901489257812, 0.22062689065933228, 0.22779476642608643, 0.23496264219284058]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 16.0, 16.0, 26.0, 41.0, 63.0, 114.0, 187.0, 332.0, 721.0, 1794.0, 5629.0, 26799.0, 197356.0, 629659.0, 155930.0, 21931.0, 4942.0, 1533.0, 637.0, 340.0, 190.0, 96.0, 69.0, 44.0, 21.0, 22.0, 15.0, 6.0, 3.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291015625, -0.27860260009765625, -0.2661895751953125, -0.25377655029296875, -0.241363525390625, -0.22895050048828125, -0.2165374755859375, -0.20412445068359375, -0.19171142578125, -0.17929840087890625, -0.1668853759765625, -0.15447235107421875, -0.142059326171875, -0.12964630126953125, -0.1172332763671875, -0.10482025146484375, -0.0924072265625, -0.07999420166015625, -0.0675811767578125, -0.05516815185546875, -0.042755126953125, -0.03034210205078125, -0.0179290771484375, -0.00551605224609375, 0.00689697265625, 0.01930999755859375, 0.0317230224609375, 0.04413604736328125, 0.056549072265625, 0.06896209716796875, 0.0813751220703125, 0.09378814697265625, 0.106201171875, 0.11861419677734375, 0.1310272216796875, 0.14344024658203125, 0.155853271484375, 0.16826629638671875, 0.1806793212890625, 0.19309234619140625, 0.20550537109375, 0.21791839599609375, 0.2303314208984375, 0.24274444580078125, 0.255157470703125, 0.26757049560546875, 0.2799835205078125, 0.29239654541015625, 0.3048095703125, 0.31722259521484375, 0.3296356201171875, 0.34204864501953125, 0.354461669921875, 0.36687469482421875, 0.3792877197265625, 0.39170074462890625, 0.40411376953125, 0.41652679443359375, 0.4289398193359375, 0.44135284423828125, 0.453765869140625, 0.46617889404296875, 0.4785919189453125, 0.49100494384765625, 0.50341796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 9.0, 14.0, 14.0, 17.0, 23.0, 34.0, 30.0, 43.0, 34.0, 47.0, 47.0, 62.0, 58.0, 62.0, 76.0, 68.0, 50.0, 47.0, 39.0, 39.0, 33.0, 22.0, 24.0, 26.0, 16.0, 15.0, 13.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.22509765625, -0.21892738342285156, -0.21275711059570312, -0.2065868377685547, -0.20041656494140625, -0.1942462921142578, -0.18807601928710938, -0.18190574645996094, -0.1757354736328125, -0.16956520080566406, -0.16339492797851562, -0.1572246551513672, -0.15105438232421875, -0.1448841094970703, -0.13871383666992188, -0.13254356384277344, -0.126373291015625, -0.12020301818847656, -0.11403274536132812, -0.10786247253417969, -0.10169219970703125, -0.09552192687988281, -0.08935165405273438, -0.08318138122558594, -0.0770111083984375, -0.07084083557128906, -0.06467056274414062, -0.05850028991699219, -0.05233001708984375, -0.04615974426269531, -0.039989471435546875, -0.03381919860839844, -0.02764892578125, -0.021478652954101562, -0.015308380126953125, -0.009138107299804688, -0.00296783447265625, 0.0032024383544921875, 0.009372711181640625, 0.015542984008789062, 0.0217132568359375, 0.027883529663085938, 0.034053802490234375, 0.04022407531738281, 0.04639434814453125, 0.05256462097167969, 0.058734893798828125, 0.06490516662597656, 0.071075439453125, 0.07724571228027344, 0.08341598510742188, 0.08958625793457031, 0.09575653076171875, 0.10192680358886719, 0.10809707641601562, 0.11426734924316406, 0.1204376220703125, 0.12660789489746094, 0.13277816772460938, 0.1389484405517578, 0.14511871337890625, 0.1512889862060547, 0.15745925903320312, 0.16362953186035156, 0.1697998046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 6.0, 12.0, 13.0, 24.0, 27.0, 45.0, 87.0, 142.0, 257.0, 412.0, 932.0, 2305.0, 7677.0, 80388.0, 859631.0, 84587.0, 7812.0, 2300.0, 890.0, 433.0, 226.0, 124.0, 83.0, 47.0, 25.0, 13.0, 21.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5278701782226562, -0.5093536376953125, -0.49083709716796875, -0.472320556640625, -0.45380401611328125, -0.4352874755859375, -0.41677093505859375, -0.39825439453125, -0.37973785400390625, -0.3612213134765625, -0.34270477294921875, -0.324188232421875, -0.30567169189453125, -0.2871551513671875, -0.26863861083984375, -0.2501220703125, -0.23160552978515625, -0.2130889892578125, -0.19457244873046875, -0.176055908203125, -0.15753936767578125, -0.1390228271484375, -0.12050628662109375, -0.10198974609375, -0.08347320556640625, -0.0649566650390625, -0.04644012451171875, -0.027923583984375, -0.00940704345703125, 0.0091094970703125, 0.02762603759765625, 0.046142578125, 0.06465911865234375, 0.0831756591796875, 0.10169219970703125, 0.120208740234375, 0.13872528076171875, 0.1572418212890625, 0.17575836181640625, 0.19427490234375, 0.21279144287109375, 0.2313079833984375, 0.24982452392578125, 0.268341064453125, 0.28685760498046875, 0.3053741455078125, 0.32389068603515625, 0.3424072265625, 0.36092376708984375, 0.3794403076171875, 0.39795684814453125, 0.416473388671875, 0.43498992919921875, 0.4535064697265625, 0.47202301025390625, 0.49053955078125, 0.5090560913085938, 0.5275726318359375, 0.5460891723632812, 0.564605712890625, 0.5831222534179688, 0.6016387939453125, 0.6201553344726562, 0.638671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 16.0, 17.0, 16.0, 45.0, 62.0, 73.0, 107.0, 126.0, 95.0, 96.0, 97.0, 81.0, 71.0, 42.0, 13.0, 13.0, 6.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2679290771484375, -1.216522216796875, -1.1651153564453125, -1.11370849609375, -1.0623016357421875, -1.010894775390625, -0.9594879150390625, -0.9080810546875, -0.8566741943359375, -0.805267333984375, -0.7538604736328125, -0.70245361328125, -0.6510467529296875, -0.599639892578125, -0.5482330322265625, -0.496826171875, -0.4454193115234375, -0.394012451171875, -0.3426055908203125, -0.29119873046875, -0.2397918701171875, -0.188385009765625, -0.1369781494140625, -0.0855712890625, -0.0341644287109375, 0.017242431640625, 0.0686492919921875, 0.12005615234375, 0.1714630126953125, 0.222869873046875, 0.2742767333984375, 0.32568359375, 0.3770904541015625, 0.428497314453125, 0.4799041748046875, 0.53131103515625, 0.5827178955078125, 0.634124755859375, 0.6855316162109375, 0.7369384765625, 0.7883453369140625, 0.839752197265625, 0.8911590576171875, 0.94256591796875, 0.9939727783203125, 1.045379638671875, 1.0967864990234375, 1.148193359375, 1.1996002197265625, 1.251007080078125, 1.3024139404296875, 1.35382080078125, 1.4052276611328125, 1.456634521484375, 1.5080413818359375, 1.5594482421875, 1.6108551025390625, 1.662261962890625, 1.7136688232421875, 1.76507568359375, 1.8164825439453125, 1.867889404296875, 1.9192962646484375, 1.970703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 9.0, 10.0, 33.0, 44.0, 199.0, 1083.0, 972378.0, 73845.0, 696.0, 157.0, 52.0, 15.0, 9.0, 12.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -0.982269287109375, -0.92742919921875, -0.872589111328125, -0.8177490234375, -0.762908935546875, -0.70806884765625, -0.653228759765625, -0.598388671875, -0.543548583984375, -0.48870849609375, -0.433868408203125, -0.3790283203125, -0.324188232421875, -0.26934814453125, -0.214508056640625, -0.15966796875, -0.104827880859375, -0.04998779296875, 0.004852294921875, 0.0596923828125, 0.114532470703125, 0.16937255859375, 0.224212646484375, 0.279052734375, 0.333892822265625, 0.38873291015625, 0.443572998046875, 0.4984130859375, 0.553253173828125, 0.60809326171875, 0.662933349609375, 0.7177734375, 0.772613525390625, 0.82745361328125, 0.882293701171875, 0.9371337890625, 0.991973876953125, 1.04681396484375, 1.101654052734375, 1.156494140625, 1.211334228515625, 1.26617431640625, 1.321014404296875, 1.3758544921875, 1.430694580078125, 1.48553466796875, 1.540374755859375, 1.59521484375, 1.650054931640625, 1.70489501953125, 1.759735107421875, 1.8145751953125, 1.869415283203125, 1.92425537109375, 1.979095458984375, 2.033935546875, 2.088775634765625, 2.14361572265625, 2.198455810546875, 2.2532958984375, 2.308135986328125, 2.36297607421875, 2.417816162109375, 2.47265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 6.0, 6.0, 14.0, 16.0, 19.0, 25.0, 30.0, 44.0, 48.0, 75.0, 76.0, 101.0, 79.0, 92.0, 70.0, 67.0, 53.0, 21.0, 29.0, 27.0, 21.0, 13.0, 11.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.368492126464844e-05, -8.103344589471817e-05, -7.83819705247879e-05, -7.573049515485764e-05, -7.307901978492737e-05, -7.04275444149971e-05, -6.777606904506683e-05, -6.512459367513657e-05, -6.24731183052063e-05, -5.982164293527603e-05, -5.7170167565345764e-05, -5.45186921954155e-05, -5.186721682548523e-05, -4.921574145555496e-05, -4.6564266085624695e-05, -4.391279071569443e-05, -4.126131534576416e-05, -3.860983997583389e-05, -3.5958364605903625e-05, -3.330688923597336e-05, -3.065541386604309e-05, -2.8003938496112823e-05, -2.5352463126182556e-05, -2.270098775625229e-05, -2.004951238632202e-05, -1.7398037016391754e-05, -1.4746561646461487e-05, -1.209508627653122e-05, -9.443610906600952e-06, -6.792135536670685e-06, -4.1406601667404175e-06, -1.4891847968101501e-06, 1.1622905731201172e-06, 3.8137659430503845e-06, 6.465241312980652e-06, 9.11671668291092e-06, 1.1768192052841187e-05, 1.4419667422771454e-05, 1.707114279270172e-05, 1.972261816263199e-05, 2.2374093532562256e-05, 2.5025568902492523e-05, 2.767704427242279e-05, 3.0328519642353058e-05, 3.2979995012283325e-05, 3.563147038221359e-05, 3.828294575214386e-05, 4.093442112207413e-05, 4.3585896492004395e-05, 4.623737186193466e-05, 4.888884723186493e-05, 5.1540322601795197e-05, 5.4191797971725464e-05, 5.684327334165573e-05, 5.9494748711586e-05, 6.214622408151627e-05, 6.479769945144653e-05, 6.74491748213768e-05, 7.010065019130707e-05, 7.275212556123734e-05, 7.54036009311676e-05, 7.805507630109787e-05, 8.070655167102814e-05, 8.33580270409584e-05, 8.600950241088867e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 15.0, 35.0, 42.0, 92.0, 184.0, 411.0, 1606.0, 14714.0, 1006623.0, 22033.0, 1913.0, 473.0, 172.0, 99.0, 51.0, 28.0, 18.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.6323318481445312, -0.6093902587890625, -0.5864486694335938, -0.563507080078125, -0.5405654907226562, -0.5176239013671875, -0.49468231201171875, -0.47174072265625, -0.44879913330078125, -0.4258575439453125, -0.40291595458984375, -0.379974365234375, -0.35703277587890625, -0.3340911865234375, -0.31114959716796875, -0.2882080078125, -0.26526641845703125, -0.2423248291015625, -0.21938323974609375, -0.196441650390625, -0.17350006103515625, -0.1505584716796875, -0.12761688232421875, -0.10467529296875, -0.08173370361328125, -0.0587921142578125, -0.03585052490234375, -0.012908935546875, 0.01003265380859375, 0.0329742431640625, 0.05591583251953125, 0.078857421875, 0.10179901123046875, 0.1247406005859375, 0.14768218994140625, 0.170623779296875, 0.19356536865234375, 0.2165069580078125, 0.23944854736328125, 0.26239013671875, 0.28533172607421875, 0.3082733154296875, 0.33121490478515625, 0.354156494140625, 0.37709808349609375, 0.4000396728515625, 0.42298126220703125, 0.4459228515625, 0.46886444091796875, 0.4918060302734375, 0.5147476196289062, 0.537689208984375, 0.5606307983398438, 0.5835723876953125, 0.6065139770507812, 0.62945556640625, 0.6523971557617188, 0.6753387451171875, 0.6982803344726562, 0.721221923828125, 0.7441635131835938, 0.7671051025390625, 0.7900466918945312, 0.81298828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 6.0, 9.0, 18.0, 117.0, 447.0, 318.0, 51.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5386962890625, -1.505126953125, -1.4715576171875, -1.43798828125, -1.4044189453125, -1.370849609375, -1.3372802734375, -1.3037109375, -1.2701416015625, -1.236572265625, -1.2030029296875, -1.16943359375, -1.1358642578125, -1.102294921875, -1.0687255859375, -1.03515625, -1.0015869140625, -0.968017578125, -0.9344482421875, -0.90087890625, -0.8673095703125, -0.833740234375, -0.8001708984375, -0.7666015625, -0.7330322265625, -0.699462890625, -0.6658935546875, -0.63232421875, -0.5987548828125, -0.565185546875, -0.5316162109375, -0.498046875, -0.4644775390625, -0.430908203125, -0.3973388671875, -0.36376953125, -0.3302001953125, -0.296630859375, -0.2630615234375, -0.2294921875, -0.1959228515625, -0.162353515625, -0.1287841796875, -0.09521484375, -0.0616455078125, -0.028076171875, 0.0054931640625, 0.0390625, 0.0726318359375, 0.106201171875, 0.1397705078125, 0.17333984375, 0.2069091796875, 0.240478515625, 0.2740478515625, 0.3076171875, 0.3411865234375, 0.374755859375, 0.4083251953125, 0.44189453125, 0.4754638671875, 0.509033203125, 0.5426025390625, 0.576171875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 19.0, 41.0, 177.0, 535.0, 190.0, 20.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.39830780029297, -21.948360443115234, -21.4984130859375, -21.0484676361084, -20.598520278930664, -20.14857292175293, -19.698625564575195, -19.248680114746094, -18.79873275756836, -18.348785400390625, -17.89883804321289, -17.44889259338379, -16.998945236206055, -16.54899787902832, -16.099050521850586, -15.649104118347168, -15.199156761169434, -14.7492094039917, -14.299263000488281, -13.849315643310547, -13.399369239807129, -12.949421882629395, -12.499475479125977, -12.049528121948242, -11.599580764770508, -11.149633407592773, -10.699687004089355, -10.249739646911621, -9.799793243408203, -9.349845886230469, -8.899898529052734, -8.449952125549316, -8.000005722045898, -7.550058841705322, -7.100111961364746, -6.650164604187012, -6.200218200683594, -5.750270843505859, -5.300323963165283, -4.850377082824707, -4.400430202484131, -3.9504833221435547, -3.5005364418029785, -3.0505893230438232, -2.600642442703247, -2.150695562362671, -1.7007484436035156, -1.2508015632629395, -0.8008546829223633, -0.35090774297714233, 0.09903919696807861, 0.5489861965179443, 0.9989330768585205, 1.4488799571990967, 1.898827075958252, 2.348773956298828, 2.7987208366394043, 3.2486677169799805, 3.6986145973205566, 4.148561477661133, 4.598508834838867, 5.048455238342285, 5.4984025955200195, 5.948349475860596, 6.398296356201172]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 9.0, 7.0, 6.0, 12.0, 8.0, 17.0, 17.0, 16.0, 20.0, 23.0, 26.0, 28.0, 32.0, 32.0, 37.0, 42.0, 44.0, 53.0, 45.0, 45.0, 53.0, 43.0, 42.0, 31.0, 37.0, 26.0, 29.0, 38.0, 29.0, 22.0, 25.0, 16.0, 13.0, 11.0, 11.0, 13.0, 15.0, 2.0, 1.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.7863407135009766, -3.668015480041504, -3.5496902465820312, -3.4313650131225586, -3.313039779663086, -3.1947145462036133, -3.0763893127441406, -2.958064079284668, -2.8397388458251953, -2.7214136123657227, -2.60308837890625, -2.4847631454467773, -2.3664379119873047, -2.248112678527832, -2.1297874450683594, -2.0114622116088867, -1.8931372165679932, -1.7748119831085205, -1.6564867496490479, -1.5381615161895752, -1.4198362827301025, -1.3015110492706299, -1.1831859350204468, -1.0648607015609741, -0.9465354681015015, -0.8282102346420288, -0.7098850011825562, -0.5915598273277283, -0.4732345938682556, -0.35490936040878296, -0.23658418655395508, -0.11825895309448242, 6.604194641113281e-05, 0.1183912605047226, 0.23671647906303406, 0.3550416827201843, 0.473366916179657, 0.5916921496391296, 0.7100173234939575, 0.8283425569534302, 0.9466677904129028, 1.0649930238723755, 1.1833182573318481, 1.3016433715820312, 1.419968605041504, 1.5382938385009766, 1.6566190719604492, 1.7749443054199219, 1.8932695388793945, 2.011594772338867, 2.12992000579834, 2.2482452392578125, 2.366570472717285, 2.484895706176758, 2.6032209396362305, 2.721546173095703, 2.839871406555176, 2.9581966400146484, 3.076521873474121, 3.1948471069335938, 3.3131723403930664, 3.431497573852539, 3.5498228073120117, 3.6681480407714844, 3.786473035812378]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 14.0, 21.0, 46.0, 84.0, 194.0, 534.0, 1476.0, 8628.0, 4133710.0, 45410.0, 2831.0, 779.0, 285.0, 120.0, 53.0, 32.0, 22.0, 17.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.83453369140625, -0.8082275390625, -0.78192138671875, -0.755615234375, -0.72930908203125, -0.7030029296875, -0.67669677734375, -0.650390625, -0.62408447265625, -0.5977783203125, -0.57147216796875, -0.545166015625, -0.51885986328125, -0.4925537109375, -0.46624755859375, -0.43994140625, -0.41363525390625, -0.3873291015625, -0.36102294921875, -0.334716796875, -0.30841064453125, -0.2821044921875, -0.25579833984375, -0.2294921875, -0.20318603515625, -0.1768798828125, -0.15057373046875, -0.124267578125, -0.09796142578125, -0.0716552734375, -0.04534912109375, -0.01904296875, 0.00726318359375, 0.0335693359375, 0.05987548828125, 0.086181640625, 0.11248779296875, 0.1387939453125, 0.16510009765625, 0.19140625, 0.21771240234375, 0.2440185546875, 0.27032470703125, 0.296630859375, 0.32293701171875, 0.3492431640625, 0.37554931640625, 0.40185546875, 0.42816162109375, 0.4544677734375, 0.48077392578125, 0.507080078125, 0.53338623046875, 0.5596923828125, 0.58599853515625, 0.6123046875, 0.63861083984375, 0.6649169921875, 0.69122314453125, 0.717529296875, 0.74383544921875, 0.7701416015625, 0.79644775390625, 0.82275390625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 2.0, 11.0, 11.0, 12.0, 10.0, 17.0, 24.0, 24.0, 25.0, 25.0, 37.0, 49.0, 41.0, 44.0, 61.0, 51.0, 65.0, 68.0, 57.0, 67.0, 45.0, 46.0, 30.0, 28.0, 27.0, 19.0, 16.0, 7.0, 13.0, 6.0, 7.0, 11.0, 5.0, 6.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.229248046875, -0.22238922119140625, -0.2155303955078125, -0.20867156982421875, -0.201812744140625, -0.19495391845703125, -0.1880950927734375, -0.18123626708984375, -0.17437744140625, -0.16751861572265625, -0.1606597900390625, -0.15380096435546875, -0.146942138671875, -0.14008331298828125, -0.1332244873046875, -0.12636566162109375, -0.1195068359375, -0.11264801025390625, -0.1057891845703125, -0.09893035888671875, -0.092071533203125, -0.08521270751953125, -0.0783538818359375, -0.07149505615234375, -0.06463623046875, -0.05777740478515625, -0.0509185791015625, -0.04405975341796875, -0.037200927734375, -0.03034210205078125, -0.0234832763671875, -0.01662445068359375, -0.009765625, -0.00290679931640625, 0.0039520263671875, 0.01081085205078125, 0.017669677734375, 0.02452850341796875, 0.0313873291015625, 0.03824615478515625, 0.04510498046875, 0.05196380615234375, 0.0588226318359375, 0.06568145751953125, 0.072540283203125, 0.07939910888671875, 0.0862579345703125, 0.09311676025390625, 0.0999755859375, 0.10683441162109375, 0.1136932373046875, 0.12055206298828125, 0.127410888671875, 0.13426971435546875, 0.1411285400390625, 0.14798736572265625, 0.15484619140625, 0.16170501708984375, 0.1685638427734375, 0.17542266845703125, 0.182281494140625, 0.18914031982421875, 0.1959991455078125, 0.20285797119140625, 0.209716796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 11.0, 19.0, 17.0, 18.0, 33.0, 56.0, 47.0, 68.0, 148.0, 370.0, 1227.0, 11815.0, 4168553.0, 9954.0, 1180.0, 357.0, 113.0, 54.0, 44.0, 51.0, 36.0, 24.0, 18.0, 24.0, 13.0, 9.0, 2.0, 6.0, 1.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.537109375, -1.494964599609375, -1.45281982421875, -1.410675048828125, -1.3685302734375, -1.326385498046875, -1.28424072265625, -1.242095947265625, -1.199951171875, -1.157806396484375, -1.11566162109375, -1.073516845703125, -1.0313720703125, -0.989227294921875, -0.94708251953125, -0.904937744140625, -0.86279296875, -0.820648193359375, -0.77850341796875, -0.736358642578125, -0.6942138671875, -0.652069091796875, -0.60992431640625, -0.567779541015625, -0.525634765625, -0.483489990234375, -0.44134521484375, -0.399200439453125, -0.3570556640625, -0.314910888671875, -0.27276611328125, -0.230621337890625, -0.1884765625, -0.146331787109375, -0.10418701171875, -0.062042236328125, -0.0198974609375, 0.022247314453125, 0.06439208984375, 0.106536865234375, 0.148681640625, 0.190826416015625, 0.23297119140625, 0.275115966796875, 0.3172607421875, 0.359405517578125, 0.40155029296875, 0.443695068359375, 0.48583984375, 0.527984619140625, 0.57012939453125, 0.612274169921875, 0.6544189453125, 0.696563720703125, 0.73870849609375, 0.780853271484375, 0.822998046875, 0.865142822265625, 0.90728759765625, 0.949432373046875, 0.9915771484375, 1.033721923828125, 1.07586669921875, 1.118011474609375, 1.16015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 27.0, 3703.0, 302.0, 34.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1875, -0.175689697265625, -0.16387939453125, -0.152069091796875, -0.1402587890625, -0.128448486328125, -0.11663818359375, -0.104827880859375, -0.093017578125, -0.081207275390625, -0.06939697265625, -0.057586669921875, -0.0457763671875, -0.033966064453125, -0.02215576171875, -0.010345458984375, 0.00146484375, 0.013275146484375, 0.02508544921875, 0.036895751953125, 0.0487060546875, 0.060516357421875, 0.07232666015625, 0.084136962890625, 0.095947265625, 0.107757568359375, 0.11956787109375, 0.131378173828125, 0.1431884765625, 0.154998779296875, 0.16680908203125, 0.178619384765625, 0.1904296875, 0.202239990234375, 0.21405029296875, 0.225860595703125, 0.2376708984375, 0.249481201171875, 0.26129150390625, 0.273101806640625, 0.284912109375, 0.296722412109375, 0.30853271484375, 0.320343017578125, 0.3321533203125, 0.343963623046875, 0.35577392578125, 0.367584228515625, 0.37939453125, 0.391204833984375, 0.40301513671875, 0.414825439453125, 0.4266357421875, 0.438446044921875, 0.45025634765625, 0.462066650390625, 0.473876953125, 0.485687255859375, 0.49749755859375, 0.509307861328125, 0.5211181640625, 0.532928466796875, 0.54473876953125, 0.556549072265625, 0.568359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 24.0, 291.0, 522.0, 127.0, 21.0, 9.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3711837530136108, -1.3162442445755005, -1.2613046169281006, -1.2063651084899902, -1.1514256000518799, -1.09648597240448, -1.0415464639663696, -0.9866068959236145, -0.9316673278808594, -0.8767277598381042, -0.8217881917953491, -0.7668486833572388, -0.7119091153144836, -0.6569695472717285, -0.6020300388336182, -0.547090470790863, -0.4921509027481079, -0.4372113347053528, -0.38227179646492004, -0.3273322582244873, -0.2723926901817322, -0.21745312213897705, -0.1625135838985443, -0.10757404565811157, -0.052634477615356445, 0.002305075526237488, 0.05724462866783142, 0.11218418180942535, 0.1671237349510193, 0.22206330299377441, 0.27700284123420715, 0.3319423794746399, 0.38688182830810547, 0.4418213963508606, 0.49676093459129333, 0.5517004728317261, 0.6066400408744812, 0.6615796089172363, 0.7165191173553467, 0.7714586853981018, 0.8263982534408569, 0.8813378214836121, 0.9362773895263672, 0.9912168979644775, 1.046156406402588, 1.1010960340499878, 1.1560355424880981, 1.210975170135498, 1.2659146785736084, 1.3208541870117188, 1.3757938146591187, 1.430733323097229, 1.485672950744629, 1.5406124591827393, 1.5955519676208496, 1.65049147605896, 1.7054311037063599, 1.7603706121444702, 1.8153102397918701, 1.8702497482299805, 1.9251892566680908, 1.9801288843154907, 2.0350685119628906, 2.090008020401001, 2.1449475288391113]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 12.0, 11.0, 16.0, 23.0, 26.0, 32.0, 33.0, 39.0, 54.0, 49.0, 64.0, 57.0, 53.0, 52.0, 49.0, 51.0, 67.0, 47.0, 48.0, 44.0, 44.0, 31.0, 19.0, 18.0, 15.0, 15.0, 6.0, 8.0, 1.0, 5.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4719772934913635, -0.45801466703414917, -0.4440520107746124, -0.43008938431739807, -0.41612672805786133, -0.402164101600647, -0.3882014751434326, -0.3742388188838959, -0.36027616262435913, -0.3463135361671448, -0.33235087990760803, -0.3183882534503937, -0.30442559719085693, -0.2904629707336426, -0.2765003442764282, -0.2625376880168915, -0.24857506155967712, -0.23461242020130157, -0.22064977884292603, -0.20668715238571167, -0.19272449612617493, -0.17876186966896057, -0.16479922831058502, -0.15083658695220947, -0.13687394559383392, -0.12291130423545837, -0.10894866287708282, -0.09498602896928787, -0.08102338761091232, -0.06706074625253677, -0.05309811234474182, -0.03913547098636627, -0.025172829627990723, -0.011210190132260323, 0.0027524493634700775, 0.01671508699655533, 0.030677728354930878, 0.04464036971330643, 0.05860300362110138, 0.07256564497947693, 0.08652828633785248, 0.10049092769622803, 0.11445356905460358, 0.12841621041297913, 0.14237883687019348, 0.15634149312973022, 0.17030411958694458, 0.18426676094532013, 0.19822940230369568, 0.21219204366207123, 0.22615468502044678, 0.24011731147766113, 0.2540799677371979, 0.26804259419441223, 0.282005250453949, 0.29596787691116333, 0.3099305033683777, 0.32389312982559204, 0.3378557860851288, 0.35181841254234314, 0.3657810688018799, 0.37974369525909424, 0.3937063217163086, 0.40766897797584534, 0.4216316342353821]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 13.0, 12.0, 23.0, 48.0, 59.0, 96.0, 188.0, 267.0, 377.0, 663.0, 1289.0, 2434.0, 4851.0, 10532.0, 25230.0, 69480.0, 214143.0, 404117.0, 203894.0, 66562.0, 24173.0, 10021.0, 4692.0, 2323.0, 1202.0, 733.0, 419.0, 226.0, 155.0, 108.0, 61.0, 49.0, 26.0, 27.0, 14.0, 11.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23779296875, -0.23069000244140625, -0.2235870361328125, -0.21648406982421875, -0.209381103515625, -0.20227813720703125, -0.1951751708984375, -0.18807220458984375, -0.18096923828125, -0.17386627197265625, -0.1667633056640625, -0.15966033935546875, -0.152557373046875, -0.14545440673828125, -0.1383514404296875, -0.13124847412109375, -0.1241455078125, -0.11704254150390625, -0.1099395751953125, -0.10283660888671875, -0.095733642578125, -0.08863067626953125, -0.0815277099609375, -0.07442474365234375, -0.06732177734375, -0.06021881103515625, -0.0531158447265625, -0.04601287841796875, -0.038909912109375, -0.03180694580078125, -0.0247039794921875, -0.01760101318359375, -0.010498046875, -0.00339508056640625, 0.0037078857421875, 0.01081085205078125, 0.017913818359375, 0.02501678466796875, 0.0321197509765625, 0.03922271728515625, 0.04632568359375, 0.05342864990234375, 0.0605316162109375, 0.06763458251953125, 0.074737548828125, 0.08184051513671875, 0.0889434814453125, 0.09604644775390625, 0.1031494140625, 0.11025238037109375, 0.1173553466796875, 0.12445831298828125, 0.131561279296875, 0.13866424560546875, 0.1457672119140625, 0.15287017822265625, 0.15997314453125, 0.16707611083984375, 0.1741790771484375, 0.18128204345703125, 0.188385009765625, 0.19548797607421875, 0.2025909423828125, 0.20969390869140625, 0.216796875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 5.0, 9.0, 6.0, 12.0, 12.0, 15.0, 22.0, 22.0, 28.0, 31.0, 40.0, 42.0, 55.0, 43.0, 41.0, 57.0, 67.0, 66.0, 61.0, 54.0, 45.0, 40.0, 38.0, 40.0, 32.0, 25.0, 12.0, 10.0, 14.0, 13.0, 7.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23095703125, -0.22406387329101562, -0.21717071533203125, -0.21027755737304688, -0.2033843994140625, -0.19649124145507812, -0.18959808349609375, -0.18270492553710938, -0.175811767578125, -0.16891860961914062, -0.16202545166015625, -0.15513229370117188, -0.1482391357421875, -0.14134597778320312, -0.13445281982421875, -0.12755966186523438, -0.12066650390625, -0.11377334594726562, -0.10688018798828125, -0.09998703002929688, -0.0930938720703125, -0.08620071411132812, -0.07930755615234375, -0.07241439819335938, -0.065521240234375, -0.058628082275390625, -0.05173492431640625, -0.044841766357421875, -0.0379486083984375, -0.031055450439453125, -0.02416229248046875, -0.017269134521484375, -0.0103759765625, -0.003482818603515625, 0.00341033935546875, 0.010303497314453125, 0.0171966552734375, 0.024089813232421875, 0.03098297119140625, 0.037876129150390625, 0.044769287109375, 0.051662445068359375, 0.05855560302734375, 0.06544876098632812, 0.0723419189453125, 0.07923507690429688, 0.08612823486328125, 0.09302139282226562, 0.09991455078125, 0.10680770874023438, 0.11370086669921875, 0.12059402465820312, 0.1274871826171875, 0.13438034057617188, 0.14127349853515625, 0.14816665649414062, 0.155059814453125, 0.16195297241210938, 0.16884613037109375, 0.17573928833007812, 0.1826324462890625, 0.18952560424804688, 0.19641876220703125, 0.20331192016601562, 0.210205078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 5.0, 10.0, 11.0, 12.0, 25.0, 20.0, 29.0, 39.0, 49.0, 82.0, 103.0, 153.0, 203.0, 325.0, 550.0, 952.0, 1935.0, 5508.0, 23968.0, 221918.0, 693507.0, 79996.0, 12216.0, 3496.0, 1405.0, 732.0, 417.0, 291.0, 176.0, 105.0, 83.0, 40.0, 52.0, 35.0, 29.0, 18.0, 16.0, 13.0, 2.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.42333984375, -0.40981292724609375, -0.3962860107421875, -0.38275909423828125, -0.369232177734375, -0.35570526123046875, -0.3421783447265625, -0.32865142822265625, -0.31512451171875, -0.30159759521484375, -0.2880706787109375, -0.27454376220703125, -0.261016845703125, -0.24748992919921875, -0.2339630126953125, -0.22043609619140625, -0.2069091796875, -0.19338226318359375, -0.1798553466796875, -0.16632843017578125, -0.152801513671875, -0.13927459716796875, -0.1257476806640625, -0.11222076416015625, -0.09869384765625, -0.08516693115234375, -0.0716400146484375, -0.05811309814453125, -0.044586181640625, -0.03105926513671875, -0.0175323486328125, -0.00400543212890625, 0.009521484375, 0.02304840087890625, 0.0365753173828125, 0.05010223388671875, 0.063629150390625, 0.07715606689453125, 0.0906829833984375, 0.10420989990234375, 0.11773681640625, 0.13126373291015625, 0.1447906494140625, 0.15831756591796875, 0.171844482421875, 0.18537139892578125, 0.1988983154296875, 0.21242523193359375, 0.2259521484375, 0.23947906494140625, 0.2530059814453125, 0.26653289794921875, 0.280059814453125, 0.29358673095703125, 0.3071136474609375, 0.32064056396484375, 0.33416748046875, 0.34769439697265625, 0.3612213134765625, 0.37474822998046875, 0.388275146484375, 0.40180206298828125, 0.4153289794921875, 0.42885589599609375, 0.4423828125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 13.0, 7.0, 14.0, 20.0, 14.0, 24.0, 26.0, 26.0, 28.0, 41.0, 38.0, 42.0, 43.0, 55.0, 47.0, 53.0, 41.0, 54.0, 37.0, 42.0, 31.0, 39.0, 39.0, 29.0, 28.0, 31.0, 24.0, 14.0, 18.0, 12.0, 9.0, 11.0, 3.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.994140625, -0.9647750854492188, -0.9354095458984375, -0.9060440063476562, -0.876678466796875, -0.8473129272460938, -0.8179473876953125, -0.7885818481445312, -0.75921630859375, -0.7298507690429688, -0.7004852294921875, -0.6711196899414062, -0.641754150390625, -0.6123886108398438, -0.5830230712890625, -0.5536575317382812, -0.5242919921875, -0.49492645263671875, -0.4655609130859375, -0.43619537353515625, -0.406829833984375, -0.37746429443359375, -0.3480987548828125, -0.31873321533203125, -0.28936767578125, -0.26000213623046875, -0.2306365966796875, -0.20127105712890625, -0.171905517578125, -0.14253997802734375, -0.1131744384765625, -0.08380889892578125, -0.054443359375, -0.02507781982421875, 0.0042877197265625, 0.03365325927734375, 0.063018798828125, 0.09238433837890625, 0.1217498779296875, 0.15111541748046875, 0.18048095703125, 0.20984649658203125, 0.2392120361328125, 0.26857757568359375, 0.297943115234375, 0.32730865478515625, 0.3566741943359375, 0.38603973388671875, 0.4154052734375, 0.44477081298828125, 0.4741363525390625, 0.5035018920898438, 0.532867431640625, 0.5622329711914062, 0.5915985107421875, 0.6209640502929688, 0.65032958984375, 0.6796951293945312, 0.7090606689453125, 0.7384262084960938, 0.767791748046875, 0.7971572875976562, 0.8265228271484375, 0.8558883666992188, 0.88525390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 9.0, 10.0, 28.0, 42.0, 111.0, 512.0, 9398.0, 1029636.0, 8062.0, 554.0, 109.0, 30.0, 18.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.15234375, -1.1238784790039062, -1.0954132080078125, -1.0669479370117188, -1.038482666015625, -1.0100173950195312, -0.9815521240234375, -0.9530868530273438, -0.92462158203125, -0.8961563110351562, -0.8676910400390625, -0.8392257690429688, -0.810760498046875, -0.7822952270507812, -0.7538299560546875, -0.7253646850585938, -0.6968994140625, -0.6684341430664062, -0.6399688720703125, -0.6115036010742188, -0.583038330078125, -0.5545730590820312, -0.5261077880859375, -0.49764251708984375, -0.46917724609375, -0.44071197509765625, -0.4122467041015625, -0.38378143310546875, -0.355316162109375, -0.32685089111328125, -0.2983856201171875, -0.26992034912109375, -0.241455078125, -0.21298980712890625, -0.1845245361328125, -0.15605926513671875, -0.127593994140625, -0.09912872314453125, -0.0706634521484375, -0.04219818115234375, -0.01373291015625, 0.01473236083984375, 0.0431976318359375, 0.07166290283203125, 0.100128173828125, 0.12859344482421875, 0.1570587158203125, 0.18552398681640625, 0.2139892578125, 0.24245452880859375, 0.2709197998046875, 0.29938507080078125, 0.327850341796875, 0.35631561279296875, 0.3847808837890625, 0.41324615478515625, 0.44171142578125, 0.47017669677734375, 0.4986419677734375, 0.5271072387695312, 0.555572509765625, 0.5840377807617188, 0.6125030517578125, 0.6409683227539062, 0.66943359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 8.0, 5.0, 7.0, 8.0, 12.0, 9.0, 10.0, 20.0, 29.0, 31.0, 44.0, 63.0, 75.0, 112.0, 103.0, 109.0, 91.0, 64.0, 41.0, 30.0, 21.0, 15.0, 14.0, 8.0, 11.0, 12.0, 14.0, 3.0, 7.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.341934204101562e-05, -6.103515625e-05, -5.8650970458984375e-05, -5.626678466796875e-05, -5.3882598876953125e-05, -5.14984130859375e-05, -4.9114227294921875e-05, -4.673004150390625e-05, -4.4345855712890625e-05, -4.1961669921875e-05, -3.9577484130859375e-05, -3.719329833984375e-05, -3.4809112548828125e-05, -3.24249267578125e-05, -3.0040740966796875e-05, -2.765655517578125e-05, -2.5272369384765625e-05, -2.288818359375e-05, -2.0503997802734375e-05, -1.811981201171875e-05, -1.5735626220703125e-05, -1.33514404296875e-05, -1.0967254638671875e-05, -8.58306884765625e-06, -6.198883056640625e-06, -3.814697265625e-06, -1.430511474609375e-06, 9.5367431640625e-07, 3.337860107421875e-06, 5.7220458984375e-06, 8.106231689453125e-06, 1.049041748046875e-05, 1.2874603271484375e-05, 1.52587890625e-05, 1.7642974853515625e-05, 2.002716064453125e-05, 2.2411346435546875e-05, 2.47955322265625e-05, 2.7179718017578125e-05, 2.956390380859375e-05, 3.1948089599609375e-05, 3.4332275390625e-05, 3.6716461181640625e-05, 3.910064697265625e-05, 4.1484832763671875e-05, 4.38690185546875e-05, 4.6253204345703125e-05, 4.863739013671875e-05, 5.1021575927734375e-05, 5.340576171875e-05, 5.5789947509765625e-05, 5.817413330078125e-05, 6.0558319091796875e-05, 6.29425048828125e-05, 6.532669067382812e-05, 6.771087646484375e-05, 7.009506225585938e-05, 7.2479248046875e-05, 7.486343383789062e-05, 7.724761962890625e-05, 7.963180541992188e-05, 8.20159912109375e-05, 8.440017700195312e-05, 8.678436279296875e-05, 8.916854858398438e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 7.0, 11.0, 8.0, 11.0, 17.0, 23.0, 38.0, 60.0, 89.0, 143.0, 285.0, 570.0, 1457.0, 4801.0, 31202.0, 691646.0, 296793.0, 16125.0, 3172.0, 1089.0, 427.0, 218.0, 122.0, 76.0, 53.0, 34.0, 25.0, 16.0, 13.0, 5.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.272216796875, -0.2644062042236328, -0.2565956115722656, -0.24878501892089844, -0.24097442626953125, -0.23316383361816406, -0.22535324096679688, -0.2175426483154297, -0.2097320556640625, -0.2019214630126953, -0.19411087036132812, -0.18630027770996094, -0.17848968505859375, -0.17067909240722656, -0.16286849975585938, -0.1550579071044922, -0.147247314453125, -0.1394367218017578, -0.13162612915039062, -0.12381553649902344, -0.11600494384765625, -0.10819435119628906, -0.10038375854492188, -0.09257316589355469, -0.0847625732421875, -0.07695198059082031, -0.06914138793945312, -0.06133079528808594, -0.05352020263671875, -0.04570960998535156, -0.037899017333984375, -0.030088424682617188, -0.02227783203125, -0.014467239379882812, -0.006656646728515625, 0.0011539459228515625, 0.00896453857421875, 0.016775131225585938, 0.024585723876953125, 0.03239631652832031, 0.0402069091796875, 0.04801750183105469, 0.055828094482421875, 0.06363868713378906, 0.07144927978515625, 0.07925987243652344, 0.08707046508789062, 0.09488105773925781, 0.102691650390625, 0.11050224304199219, 0.11831283569335938, 0.12612342834472656, 0.13393402099609375, 0.14174461364746094, 0.14955520629882812, 0.1573657989501953, 0.1651763916015625, 0.1729869842529297, 0.18079757690429688, 0.18860816955566406, 0.19641876220703125, 0.20422935485839844, 0.21203994750976562, 0.2198505401611328, 0.2276611328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 11.0, 37.0, 44.0, 82.0, 107.0, 158.0, 165.0, 127.0, 98.0, 66.0, 25.0, 19.0, 14.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4384765625, -0.4256553649902344, -0.41283416748046875, -0.4000129699707031, -0.3871917724609375, -0.3743705749511719, -0.36154937744140625, -0.3487281799316406, -0.335906982421875, -0.3230857849121094, -0.31026458740234375, -0.2974433898925781, -0.2846221923828125, -0.2718009948730469, -0.25897979736328125, -0.24615859985351562, -0.23333740234375, -0.22051620483398438, -0.20769500732421875, -0.19487380981445312, -0.1820526123046875, -0.16923141479492188, -0.15641021728515625, -0.14358901977539062, -0.130767822265625, -0.11794662475585938, -0.10512542724609375, -0.09230422973632812, -0.0794830322265625, -0.06666183471679688, -0.05384063720703125, -0.041019439697265625, -0.0281982421875, -0.015377044677734375, -0.00255584716796875, 0.010265350341796875, 0.0230865478515625, 0.035907745361328125, 0.04872894287109375, 0.061550140380859375, 0.074371337890625, 0.08719253540039062, 0.10001373291015625, 0.11283493041992188, 0.1256561279296875, 0.13847732543945312, 0.15129852294921875, 0.16411972045898438, 0.17694091796875, 0.18976211547851562, 0.20258331298828125, 0.21540451049804688, 0.2282257080078125, 0.24104690551757812, 0.25386810302734375, 0.2666893005371094, 0.279510498046875, 0.2923316955566406, 0.30515289306640625, 0.3179740905761719, 0.3307952880859375, 0.3436164855957031, 0.35643768310546875, 0.3692588806152344, 0.382080078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 22.0, 50.0, 150.0, 305.0, 285.0, 135.0, 32.0, 9.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.243878364562988, -7.036629676818848, -6.829380989074707, -6.622132301330566, -6.414883613586426, -6.207634925842285, -6.0003862380981445, -5.793137550354004, -5.585888862609863, -5.378640174865723, -5.171391487121582, -4.964142799377441, -4.756894111633301, -4.54964542388916, -4.3423967361450195, -4.135148048400879, -3.9278995990753174, -3.7206509113311768, -3.513402223587036, -3.3061535358428955, -3.098904848098755, -2.8916563987731934, -2.6844077110290527, -2.477159023284912, -2.2699103355407715, -2.062661647796631, -1.8554129600524902, -1.6481642723083496, -1.440915584564209, -1.233667016029358, -1.0264183282852173, -0.8191696405410767, -0.6119208335876465, -0.40467214584350586, -0.19742348790168762, 0.009825170040130615, 0.21707385778427124, 0.4243224859237671, 0.6315711736679077, 0.8388198614120483, 1.046068549156189, 1.2533172369003296, 1.4605659246444702, 1.6678144931793213, 1.875063180923462, 2.0823118686676025, 2.289560556411743, 2.496809244155884, 2.7040579319000244, 2.911306619644165, 3.1185553073883057, 3.3258039951324463, 3.533052682876587, 3.7403011322021484, 3.947549819946289, 4.15479850769043, 4.36204719543457, 4.569295883178711, 4.776544570922852, 4.983793258666992, 5.191041946411133, 5.398290634155273, 5.605539321899414, 5.812788009643555, 6.020036697387695]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 12.0, 9.0, 11.0, 18.0, 24.0, 17.0, 29.0, 23.0, 27.0, 22.0, 37.0, 50.0, 43.0, 42.0, 53.0, 53.0, 42.0, 44.0, 49.0, 47.0, 45.0, 29.0, 27.0, 25.0, 31.0, 24.0, 22.0, 15.0, 17.0, 14.0, 18.0, 6.0, 7.0, 7.0, 4.0, 3.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.311081886291504, -4.176558971405029, -4.042036056518555, -3.90751314163208, -3.7729902267456055, -3.638467311859131, -3.503944158554077, -3.3694212436676025, -3.234898328781128, -3.1003754138946533, -2.9658524990081787, -2.831329584121704, -2.6968064308166504, -2.562283515930176, -2.427760601043701, -2.2932376861572266, -2.158714771270752, -2.0241918563842773, -1.8896689414978027, -1.7551459074020386, -1.620622992515564, -1.4861000776290894, -1.3515770435333252, -1.2170541286468506, -1.082531213760376, -0.9480082988739014, -0.813485324382782, -0.6789623498916626, -0.544439435005188, -0.4099165201187134, -0.275393545627594, -0.1408705711364746, -0.006347179412841797, 0.1281757652759552, 0.2626987099647522, 0.3972216546535492, 0.5317445993423462, 0.6662675142288208, 0.8007904887199402, 0.9353134632110596, 1.0698363780975342, 1.2043592929840088, 1.3388822078704834, 1.4734052419662476, 1.6079281568527222, 1.7424510717391968, 1.876974105834961, 2.0114970207214355, 2.14601993560791, 2.2805428504943848, 2.4150657653808594, 2.549588680267334, 2.6841115951538086, 2.818634510040283, 2.953157663345337, 3.0876805782318115, 3.222203493118286, 3.3567264080047607, 3.4912493228912354, 3.62577223777771, 3.7602953910827637, 3.8948183059692383, 4.029341220855713, 4.1638641357421875, 4.298387050628662]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 6.0, 19.0, 21.0, 35.0, 32.0, 70.0, 106.0, 210.0, 407.0, 946.0, 3677.0, 33943.0, 4091754.0, 55981.0, 4798.0, 1211.0, 448.0, 227.0, 133.0, 79.0, 45.0, 37.0, 21.0, 18.0, 7.0, 5.0, 7.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4614448547363281, -0.44266510009765625, -0.4238853454589844, -0.4051055908203125, -0.3863258361816406, -0.36754608154296875, -0.3487663269042969, -0.329986572265625, -0.3112068176269531, -0.29242706298828125, -0.2736473083496094, -0.2548675537109375, -0.23608779907226562, -0.21730804443359375, -0.19852828979492188, -0.17974853515625, -0.16096878051757812, -0.14218902587890625, -0.12340927124023438, -0.1046295166015625, -0.08584976196289062, -0.06707000732421875, -0.048290252685546875, -0.029510498046875, -0.010730743408203125, 0.00804901123046875, 0.026828765869140625, 0.0456085205078125, 0.06438827514648438, 0.08316802978515625, 0.10194778442382812, 0.1207275390625, 0.13950729370117188, 0.15828704833984375, 0.17706680297851562, 0.1958465576171875, 0.21462631225585938, 0.23340606689453125, 0.2521858215332031, 0.270965576171875, 0.2897453308105469, 0.30852508544921875, 0.3273048400878906, 0.3460845947265625, 0.3648643493652344, 0.38364410400390625, 0.4024238586425781, 0.42120361328125, 0.4399833679199219, 0.45876312255859375, 0.4775428771972656, 0.4963226318359375, 0.5151023864746094, 0.5338821411132812, 0.5526618957519531, 0.571441650390625, 0.5902214050292969, 0.6090011596679688, 0.6277809143066406, 0.6465606689453125, 0.6653404235839844, 0.6841201782226562, 0.7028999328613281, 0.7216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 17.0, 22.0, 16.0, 36.0, 39.0, 52.0, 62.0, 57.0, 74.0, 72.0, 84.0, 84.0, 72.0, 66.0, 52.0, 30.0, 29.0, 21.0, 17.0, 10.0, 15.0, 9.0, 10.0, 4.0, 1.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2939453125, -0.28488922119140625, -0.2758331298828125, -0.26677703857421875, -0.257720947265625, -0.24866485595703125, -0.2396087646484375, -0.23055267333984375, -0.22149658203125, -0.21244049072265625, -0.2033843994140625, -0.19432830810546875, -0.185272216796875, -0.17621612548828125, -0.1671600341796875, -0.15810394287109375, -0.1490478515625, -0.13999176025390625, -0.1309356689453125, -0.12187957763671875, -0.112823486328125, -0.10376739501953125, -0.0947113037109375, -0.08565521240234375, -0.07659912109375, -0.06754302978515625, -0.0584869384765625, -0.04943084716796875, -0.040374755859375, -0.03131866455078125, -0.0222625732421875, -0.01320648193359375, -0.004150390625, 0.00490570068359375, 0.0139617919921875, 0.02301788330078125, 0.032073974609375, 0.04113006591796875, 0.0501861572265625, 0.05924224853515625, 0.06829833984375, 0.07735443115234375, 0.0864105224609375, 0.09546661376953125, 0.104522705078125, 0.11357879638671875, 0.1226348876953125, 0.13169097900390625, 0.1407470703125, 0.14980316162109375, 0.1588592529296875, 0.16791534423828125, 0.176971435546875, 0.18602752685546875, 0.1950836181640625, 0.20413970947265625, 0.21319580078125, 0.22225189208984375, 0.2313079833984375, 0.24036407470703125, 0.249420166015625, 0.25847625732421875, 0.2675323486328125, 0.27658843994140625, 0.28564453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 17.0, 23.0, 24.0, 37.0, 47.0, 65.0, 92.0, 83.0, 118.0, 125.0, 150.0, 159.0, 206.0, 388.0, 9716.0, 4181005.0, 724.0, 270.0, 182.0, 158.0, 144.0, 92.0, 81.0, 81.0, 66.0, 45.0, 29.0, 22.0, 22.0, 22.0, 17.0, 9.0, 5.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.708984375, -3.597320556640625, -3.48565673828125, -3.373992919921875, -3.2623291015625, -3.150665283203125, -3.03900146484375, -2.927337646484375, -2.815673828125, -2.704010009765625, -2.59234619140625, -2.480682373046875, -2.3690185546875, -2.257354736328125, -2.14569091796875, -2.034027099609375, -1.92236328125, -1.810699462890625, -1.69903564453125, -1.587371826171875, -1.4757080078125, -1.364044189453125, -1.25238037109375, -1.140716552734375, -1.029052734375, -0.917388916015625, -0.80572509765625, -0.694061279296875, -0.5823974609375, -0.470733642578125, -0.35906982421875, -0.247406005859375, -0.1357421875, -0.024078369140625, 0.08758544921875, 0.199249267578125, 0.3109130859375, 0.422576904296875, 0.53424072265625, 0.645904541015625, 0.757568359375, 0.869232177734375, 0.98089599609375, 1.092559814453125, 1.2042236328125, 1.315887451171875, 1.42755126953125, 1.539215087890625, 1.65087890625, 1.762542724609375, 1.87420654296875, 1.985870361328125, 2.0975341796875, 2.209197998046875, 2.32086181640625, 2.432525634765625, 2.544189453125, 2.655853271484375, 2.76751708984375, 2.879180908203125, 2.9908447265625, 3.102508544921875, 3.21417236328125, 3.325836181640625, 3.4375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 249.0, 3829.0, 7.0, 1.0, 0.0, 1.0], "bins": [-4.125, -4.055194854736328, -3.9853897094726562, -3.9155845642089844, -3.8457794189453125, -3.7759742736816406, -3.7061691284179688, -3.636363983154297, -3.566558837890625, -3.496753692626953, -3.4269485473632812, -3.3571434020996094, -3.2873382568359375, -3.2175331115722656, -3.1477279663085938, -3.077922821044922, -3.00811767578125, -2.938312530517578, -2.8685073852539062, -2.7987022399902344, -2.7288970947265625, -2.6590919494628906, -2.5892868041992188, -2.519481658935547, -2.449676513671875, -2.379871368408203, -2.3100662231445312, -2.2402610778808594, -2.1704559326171875, -2.1006507873535156, -2.0308456420898438, -1.9610404968261719, -1.8912353515625, -1.8214302062988281, -1.7516250610351562, -1.6818199157714844, -1.6120147705078125, -1.5422096252441406, -1.4724044799804688, -1.4025993347167969, -1.332794189453125, -1.2629890441894531, -1.1931838989257812, -1.1233787536621094, -1.0535736083984375, -0.9837684631347656, -0.9139633178710938, -0.8441581726074219, -0.77435302734375, -0.7045478820800781, -0.6347427368164062, -0.5649375915527344, -0.4951324462890625, -0.4253273010253906, -0.35552215576171875, -0.2857170104980469, -0.215911865234375, -0.14610671997070312, -0.07630157470703125, -0.006496429443359375, 0.0633087158203125, 0.13311386108398438, 0.20291900634765625, 0.2727241516113281, 0.342529296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 30.0, 225.0, 634.0, 92.0, 15.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-15.436528205871582, -15.161609649658203, -14.886691093444824, -14.611773490905762, -14.336854934692383, -14.061936378479004, -13.787017822265625, -13.512100219726562, -13.237181663513184, -12.962263107299805, -12.687344551086426, -12.412426948547363, -12.137508392333984, -11.862589836120605, -11.587671279907227, -11.312753677368164, -11.037834167480469, -10.76291561126709, -10.487997055053711, -10.213079452514648, -9.93816089630127, -9.66324234008789, -9.388323783874512, -9.113405227661133, -8.83848762512207, -8.563569068908691, -8.288650512695312, -8.01373291015625, -7.738814353942871, -7.463895797729492, -7.188977241516113, -6.914059162139893, -6.63914155960083, -6.364223003387451, -6.0893049240112305, -5.814386367797852, -5.539468288421631, -5.264549732208252, -4.989631652832031, -4.714713096618652, -4.439794540405273, -4.1648759841918945, -3.889957904815674, -3.615039348602295, -3.340121269226074, -3.0652027130126953, -2.7902843952178955, -2.5153660774230957, -2.240447998046875, -1.9655296802520752, -1.6906113624572754, -1.415692925453186, -1.1407746076583862, -0.8658562898635864, -0.5909378528594971, -0.31601953506469727, -0.04110121726989746, 0.23381713032722473, 0.5087354779243469, 0.7836538553237915, 1.0585721731185913, 1.3334904909133911, 1.6084089279174805, 1.8833272457122803, 2.15824556350708]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 23.0, 25.0, 33.0, 66.0, 78.0, 99.0, 165.0, 153.0, 121.0, 88.0, 45.0, 25.0, 24.0, 17.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.094334602355957, -5.877405166625977, -5.660475730895996, -5.443546295166016, -5.226616859436035, -5.009687423706055, -4.792757987976074, -4.575828552246094, -4.358899116516113, -4.141969680786133, -3.9250402450561523, -3.708110809326172, -3.4911813735961914, -3.274251937866211, -3.0573225021362305, -2.84039306640625, -2.6234633922576904, -2.40653395652771, -2.1896045207977295, -1.972675085067749, -1.7557456493377686, -1.5388160943984985, -1.321886658668518, -1.1049572229385376, -0.8880277872085571, -0.6710983514785767, -0.4541688859462738, -0.23723942041397095, -0.02030998468399048, 0.19661951065063477, 0.41354894638061523, 0.6304783821105957, 0.8474078178405762, 1.0643372535705566, 1.281266689300537, 1.4981961250305176, 1.715125560760498, 1.932055115699768, 2.148984432220459, 2.3659138679504395, 2.58284330368042, 2.7997727394104004, 3.016702175140381, 3.2336316108703613, 3.450561046600342, 3.6674904823303223, 3.8844199180603027, 4.101349353790283, 4.318279266357422, 4.535208702087402, 4.752138137817383, 4.969067573547363, 5.185997009277344, 5.402926445007324, 5.619855880737305, 5.836785316467285, 6.053714752197266, 6.270644187927246, 6.487573623657227, 6.704503059387207, 6.9214324951171875, 7.138361930847168, 7.355291366577148, 7.572220802307129, 7.789150238037109]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 12.0, 15.0, 25.0, 28.0, 53.0, 80.0, 141.0, 256.0, 433.0, 840.0, 2154.0, 6479.0, 27877.0, 233341.0, 677445.0, 78909.0, 13862.0, 3763.0, 1387.0, 622.0, 317.0, 192.0, 116.0, 62.0, 50.0, 22.0, 19.0, 14.0, 8.0, 5.0, 4.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.69287109375, -0.6714019775390625, -0.649932861328125, -0.6284637451171875, -0.60699462890625, -0.5855255126953125, -0.564056396484375, -0.5425872802734375, -0.5211181640625, -0.4996490478515625, -0.478179931640625, -0.4567108154296875, -0.43524169921875, -0.4137725830078125, -0.392303466796875, -0.3708343505859375, -0.349365234375, -0.3278961181640625, -0.306427001953125, -0.2849578857421875, -0.26348876953125, -0.2420196533203125, -0.220550537109375, -0.1990814208984375, -0.1776123046875, -0.1561431884765625, -0.134674072265625, -0.1132049560546875, -0.09173583984375, -0.0702667236328125, -0.048797607421875, -0.0273284912109375, -0.005859375, 0.0156097412109375, 0.037078857421875, 0.0585479736328125, 0.08001708984375, 0.1014862060546875, 0.122955322265625, 0.1444244384765625, 0.1658935546875, 0.1873626708984375, 0.208831787109375, 0.2303009033203125, 0.25177001953125, 0.2732391357421875, 0.294708251953125, 0.3161773681640625, 0.337646484375, 0.3591156005859375, 0.380584716796875, 0.4020538330078125, 0.42352294921875, 0.4449920654296875, 0.466461181640625, 0.4879302978515625, 0.5093994140625, 0.5308685302734375, 0.552337646484375, 0.5738067626953125, 0.59527587890625, 0.6167449951171875, 0.638214111328125, 0.6596832275390625, 0.68115234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 8.0, 11.0, 8.0, 28.0, 29.0, 32.0, 36.0, 55.0, 63.0, 78.0, 84.0, 92.0, 97.0, 80.0, 71.0, 63.0, 44.0, 31.0, 26.0, 14.0, 12.0, 11.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5005340576171875, -0.483001708984375, -0.4654693603515625, -0.44793701171875, -0.4304046630859375, -0.412872314453125, -0.3953399658203125, -0.3778076171875, -0.3602752685546875, -0.342742919921875, -0.3252105712890625, -0.30767822265625, -0.2901458740234375, -0.272613525390625, -0.2550811767578125, -0.237548828125, -0.2200164794921875, -0.202484130859375, -0.1849517822265625, -0.16741943359375, -0.1498870849609375, -0.132354736328125, -0.1148223876953125, -0.0972900390625, -0.0797576904296875, -0.062225341796875, -0.0446929931640625, -0.02716064453125, -0.0096282958984375, 0.007904052734375, 0.0254364013671875, 0.04296875, 0.0605010986328125, 0.078033447265625, 0.0955657958984375, 0.11309814453125, 0.1306304931640625, 0.148162841796875, 0.1656951904296875, 0.1832275390625, 0.2007598876953125, 0.218292236328125, 0.2358245849609375, 0.25335693359375, 0.2708892822265625, 0.288421630859375, 0.3059539794921875, 0.323486328125, 0.3410186767578125, 0.358551025390625, 0.3760833740234375, 0.39361572265625, 0.4111480712890625, 0.428680419921875, 0.4462127685546875, 0.4637451171875, 0.4812774658203125, 0.498809814453125, 0.5163421630859375, 0.53387451171875, 0.5514068603515625, 0.568939208984375, 0.5864715576171875, 0.60400390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 12.0, 36.0, 79.0, 196.0, 610.0, 3402.0, 1027021.0, 15698.0, 971.0, 298.0, 112.0, 56.0, 19.0, 13.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.1197509765625, -3.007080078125, -2.8944091796875, -2.78173828125, -2.6690673828125, -2.556396484375, -2.4437255859375, -2.3310546875, -2.2183837890625, -2.105712890625, -1.9930419921875, -1.88037109375, -1.7677001953125, -1.655029296875, -1.5423583984375, -1.4296875, -1.3170166015625, -1.204345703125, -1.0916748046875, -0.97900390625, -0.8663330078125, -0.753662109375, -0.6409912109375, -0.5283203125, -0.4156494140625, -0.302978515625, -0.1903076171875, -0.07763671875, 0.0350341796875, 0.147705078125, 0.2603759765625, 0.373046875, 0.4857177734375, 0.598388671875, 0.7110595703125, 0.82373046875, 0.9364013671875, 1.049072265625, 1.1617431640625, 1.2744140625, 1.3870849609375, 1.499755859375, 1.6124267578125, 1.72509765625, 1.8377685546875, 1.950439453125, 2.0631103515625, 2.17578125, 2.2884521484375, 2.401123046875, 2.5137939453125, 2.62646484375, 2.7391357421875, 2.851806640625, 2.9644775390625, 3.0771484375, 3.1898193359375, 3.302490234375, 3.4151611328125, 3.52783203125, 3.6405029296875, 3.753173828125, 3.8658447265625, 3.978515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 10.0, 28.0, 92.0, 268.0, 270.0, 209.0, 95.0, 27.0, 10.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.91046142578125, -7.6802978515625, -7.45013427734375, -7.219970703125, -6.98980712890625, -6.7596435546875, -6.52947998046875, -6.29931640625, -6.06915283203125, -5.8389892578125, -5.60882568359375, -5.378662109375, -5.14849853515625, -4.9183349609375, -4.68817138671875, -4.4580078125, -4.22784423828125, -3.9976806640625, -3.76751708984375, -3.537353515625, -3.30718994140625, -3.0770263671875, -2.84686279296875, -2.61669921875, -2.38653564453125, -2.1563720703125, -1.92620849609375, -1.696044921875, -1.46588134765625, -1.2357177734375, -1.00555419921875, -0.775390625, -0.54522705078125, -0.3150634765625, -0.08489990234375, 0.145263671875, 0.37542724609375, 0.6055908203125, 0.83575439453125, 1.06591796875, 1.29608154296875, 1.5262451171875, 1.75640869140625, 1.986572265625, 2.21673583984375, 2.4468994140625, 2.67706298828125, 2.9072265625, 3.13739013671875, 3.3675537109375, 3.59771728515625, 3.827880859375, 4.05804443359375, 4.2882080078125, 4.51837158203125, 4.74853515625, 4.97869873046875, 5.2088623046875, 5.43902587890625, 5.669189453125, 5.89935302734375, 6.1295166015625, 6.35968017578125, 6.58984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 11.0, 31.0, 120.0, 1040.0, 1042332.0, 4711.0, 225.0, 45.0, 19.0, 10.0, 3.0, 6.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.202667236328125, -4.09674072265625, -3.990814208984375, -3.8848876953125, -3.778961181640625, -3.67303466796875, -3.567108154296875, -3.461181640625, -3.355255126953125, -3.24932861328125, -3.143402099609375, -3.0374755859375, -2.931549072265625, -2.82562255859375, -2.719696044921875, -2.61376953125, -2.507843017578125, -2.40191650390625, -2.295989990234375, -2.1900634765625, -2.084136962890625, -1.97821044921875, -1.872283935546875, -1.766357421875, -1.660430908203125, -1.55450439453125, -1.448577880859375, -1.3426513671875, -1.236724853515625, -1.13079833984375, -1.024871826171875, -0.9189453125, -0.813018798828125, -0.70709228515625, -0.601165771484375, -0.4952392578125, -0.389312744140625, -0.28338623046875, -0.177459716796875, -0.071533203125, 0.034393310546875, 0.14031982421875, 0.246246337890625, 0.3521728515625, 0.458099365234375, 0.56402587890625, 0.669952392578125, 0.77587890625, 0.881805419921875, 0.98773193359375, 1.093658447265625, 1.1995849609375, 1.305511474609375, 1.41143798828125, 1.517364501953125, 1.623291015625, 1.729217529296875, 1.83514404296875, 1.941070556640625, 2.0469970703125, 2.152923583984375, 2.25885009765625, 2.364776611328125, 2.470703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 5.0, 9.0, 7.0, 4.0, 10.0, 8.0, 17.0, 19.0, 32.0, 26.0, 57.0, 68.0, 122.0, 171.0, 132.0, 76.0, 56.0, 38.0, 37.0, 22.0, 14.0, 5.0, 6.0, 11.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010693073272705078, -0.00010365061461925507, -0.00010037049651145935, -9.709037840366364e-05, -9.381026029586792e-05, -9.05301421880722e-05, -8.725002408027649e-05, -8.396990597248077e-05, -8.068978786468506e-05, -7.740966975688934e-05, -7.412955164909363e-05, -7.084943354129791e-05, -6.75693154335022e-05, -6.428919732570648e-05, -6.1009079217910767e-05, -5.772896111011505e-05, -5.4448843002319336e-05, -5.116872489452362e-05, -4.7888606786727905e-05, -4.460848867893219e-05, -4.1328370571136475e-05, -3.804825246334076e-05, -3.4768134355545044e-05, -3.148801624774933e-05, -2.8207898139953613e-05, -2.4927780032157898e-05, -2.1647661924362183e-05, -1.8367543816566467e-05, -1.5087425708770752e-05, -1.1807307600975037e-05, -8.527189493179321e-06, -5.247071385383606e-06, -1.9669532775878906e-06, 1.3131648302078247e-06, 4.59328293800354e-06, 7.873401045799255e-06, 1.115351915359497e-05, 1.4433637261390686e-05, 1.77137553691864e-05, 2.0993873476982117e-05, 2.4273991584777832e-05, 2.7554109692573547e-05, 3.083422780036926e-05, 3.411434590816498e-05, 3.739446401596069e-05, 4.067458212375641e-05, 4.3954700231552124e-05, 4.723481833934784e-05, 5.0514936447143555e-05, 5.379505455493927e-05, 5.7075172662734985e-05, 6.03552907705307e-05, 6.363540887832642e-05, 6.691552698612213e-05, 7.019564509391785e-05, 7.347576320171356e-05, 7.675588130950928e-05, 8.003599941730499e-05, 8.331611752510071e-05, 8.659623563289642e-05, 8.987635374069214e-05, 9.315647184848785e-05, 9.643658995628357e-05, 9.971670806407928e-05, 0.000102996826171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 19.0, 95.0, 365.0, 8637.0, 1037654.0, 1500.0, 188.0, 57.0, 16.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.142578125, -2.05438232421875, -1.9661865234375, -1.87799072265625, -1.789794921875, -1.70159912109375, -1.6134033203125, -1.52520751953125, -1.43701171875, -1.34881591796875, -1.2606201171875, -1.17242431640625, -1.084228515625, -0.99603271484375, -0.9078369140625, -0.81964111328125, -0.7314453125, -0.64324951171875, -0.5550537109375, -0.46685791015625, -0.378662109375, -0.29046630859375, -0.2022705078125, -0.11407470703125, -0.02587890625, 0.06231689453125, 0.1505126953125, 0.23870849609375, 0.326904296875, 0.41510009765625, 0.5032958984375, 0.59149169921875, 0.6796875, 0.76788330078125, 0.8560791015625, 0.94427490234375, 1.032470703125, 1.12066650390625, 1.2088623046875, 1.29705810546875, 1.38525390625, 1.47344970703125, 1.5616455078125, 1.64984130859375, 1.738037109375, 1.82623291015625, 1.9144287109375, 2.00262451171875, 2.0908203125, 2.17901611328125, 2.2672119140625, 2.35540771484375, 2.443603515625, 2.53179931640625, 2.6199951171875, 2.70819091796875, 2.79638671875, 2.88458251953125, 2.9727783203125, 3.06097412109375, 3.149169921875, 3.23736572265625, 3.3255615234375, 3.41375732421875, 3.501953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 14.0, 55.0, 432.0, 407.0, 54.0, 20.0, 5.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.071685791015625, -1.00860595703125, -0.945526123046875, -0.8824462890625, -0.819366455078125, -0.75628662109375, -0.693206787109375, -0.630126953125, -0.567047119140625, -0.50396728515625, -0.440887451171875, -0.3778076171875, -0.314727783203125, -0.25164794921875, -0.188568115234375, -0.12548828125, -0.062408447265625, 0.00067138671875, 0.063751220703125, 0.1268310546875, 0.189910888671875, 0.25299072265625, 0.316070556640625, 0.379150390625, 0.442230224609375, 0.50531005859375, 0.568389892578125, 0.6314697265625, 0.694549560546875, 0.75762939453125, 0.820709228515625, 0.8837890625, 0.946868896484375, 1.00994873046875, 1.073028564453125, 1.1361083984375, 1.199188232421875, 1.26226806640625, 1.325347900390625, 1.388427734375, 1.451507568359375, 1.51458740234375, 1.577667236328125, 1.6407470703125, 1.703826904296875, 1.76690673828125, 1.829986572265625, 1.89306640625, 1.956146240234375, 2.01922607421875, 2.082305908203125, 2.1453857421875, 2.208465576171875, 2.27154541015625, 2.334625244140625, 2.397705078125, 2.460784912109375, 2.52386474609375, 2.586944580078125, 2.6500244140625, 2.713104248046875, 2.77618408203125, 2.839263916015625, 2.90234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 20.0, 52.0, 345.0, 510.0, 44.0, 12.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40204620361328, -37.2132682800293, -36.02449035644531, -34.83570861816406, -33.64693069458008, -32.458152770996094, -31.26937484741211, -30.080595016479492, -28.891815185546875, -27.70303726196289, -26.514257431030273, -25.32547950744629, -24.136699676513672, -22.947921752929688, -21.759143829345703, -20.570363998413086, -19.3815860748291, -18.192808151245117, -17.0040283203125, -15.815250396728516, -14.626470565795898, -13.437692642211914, -12.248913764953613, -11.060134887695312, -9.871356010437012, -8.682577133178711, -7.49379825592041, -6.305019855499268, -5.116240978240967, -3.927462100982666, -2.7386837005615234, -1.5499048233032227, -0.3611259460449219, 0.8276528120040894, 2.0164315700531006, 3.2052102088928223, 4.393989086151123, 5.582767963409424, 6.771546363830566, 7.960325241088867, 9.149104118347168, 10.337882995605469, 11.52666187286377, 12.71544075012207, 13.904218673706055, 15.092998504638672, 16.281776428222656, 17.47055435180664, 18.659334182739258, 19.848112106323242, 21.03689193725586, 22.225669860839844, 23.41444969177246, 24.603227615356445, 25.792007446289062, 26.980785369873047, 28.16956329345703, 29.358341217041016, 30.547121047973633, 31.735898971557617, 32.924678802490234, 34.11345672607422, 35.3022346496582, 36.49101257324219, 37.67979431152344]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 3.0, 6.0, 5.0, 10.0, 14.0, 18.0, 23.0, 27.0, 45.0, 29.0, 32.0, 46.0, 57.0, 63.0, 75.0, 60.0, 58.0, 63.0, 71.0, 45.0, 45.0, 50.0, 25.0, 23.0, 25.0, 14.0, 17.0, 9.0, 6.0, 9.0, 5.0, 11.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-16.041461944580078, -15.645145416259766, -15.248828887939453, -14.852511405944824, -14.456194877624512, -14.0598783493042, -13.66356086730957, -13.267244338989258, -12.870927810668945, -12.474611282348633, -12.07829475402832, -11.681977272033691, -11.285660743713379, -10.889344215393066, -10.493026733398438, -10.096710205078125, -9.700393676757812, -9.3040771484375, -8.907760620117188, -8.511443138122559, -8.115126609802246, -7.718810081481934, -7.322493076324463, -6.926176071166992, -6.52985954284668, -6.133543014526367, -5.7372260093688965, -5.340909004211426, -4.944592475891113, -4.548275947570801, -4.15195894241333, -3.7556421756744385, -3.359325408935547, -2.9630086421966553, -2.5666918754577637, -2.170375108718872, -1.7740583419799805, -1.3777415752410889, -0.9814248085021973, -0.5851080417633057, -0.18879127502441406, 0.20752549171447754, 0.6038422584533691, 1.0001590251922607, 1.3964757919311523, 1.792792558670044, 2.1891093254089355, 2.585426092147827, 2.9817428588867188, 3.3780596256256104, 3.774376392364502, 4.170693397521973, 4.567009925842285, 4.963326454162598, 5.359643459320068, 5.755960464477539, 6.152276992797852, 6.548593521118164, 6.944910526275635, 7.3412275314331055, 7.737544059753418, 8.13386058807373, 8.53017807006836, 8.926494598388672, 9.322811126708984]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 15.0, 15.0, 23.0, 32.0, 49.0, 84.0, 113.0, 157.0, 258.0, 356.0, 660.0, 1124.0, 1924.0, 3987.0, 8995.0, 26012.0, 142763.0, 3075730.0, 846898.0, 56645.0, 15315.0, 6033.0, 2909.0, 1611.0, 891.0, 573.0, 347.0, 219.0, 163.0, 98.0, 64.0, 54.0, 48.0, 28.0, 14.0, 18.0, 6.0, 8.0, 4.0, 7.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.357421875, -0.3468437194824219, -0.33626556396484375, -0.3256874084472656, -0.3151092529296875, -0.3045310974121094, -0.29395294189453125, -0.2833747863769531, -0.272796630859375, -0.2622184753417969, -0.25164031982421875, -0.24106216430664062, -0.2304840087890625, -0.21990585327148438, -0.20932769775390625, -0.19874954223632812, -0.18817138671875, -0.17759323120117188, -0.16701507568359375, -0.15643692016601562, -0.1458587646484375, -0.13528060913085938, -0.12470245361328125, -0.11412429809570312, -0.103546142578125, -0.09296798706054688, -0.08238983154296875, -0.07181167602539062, -0.0612335205078125, -0.050655364990234375, -0.04007720947265625, -0.029499053955078125, -0.0189208984375, -0.008342742919921875, 0.00223541259765625, 0.012813568115234375, 0.0233917236328125, 0.033969879150390625, 0.04454803466796875, 0.055126190185546875, 0.065704345703125, 0.07628250122070312, 0.08686065673828125, 0.09743881225585938, 0.1080169677734375, 0.11859512329101562, 0.12917327880859375, 0.13975143432617188, 0.15032958984375, 0.16090774536132812, 0.17148590087890625, 0.18206405639648438, 0.1926422119140625, 0.20322036743164062, 0.21379852294921875, 0.22437667846679688, 0.234954833984375, 0.24553298950195312, 0.25611114501953125, 0.2666893005371094, 0.2772674560546875, 0.2878456115722656, 0.29842376708984375, 0.3090019226074219, 0.319580078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 6.0, 3.0, 13.0, 19.0, 19.0, 27.0, 27.0, 49.0, 56.0, 68.0, 70.0, 88.0, 74.0, 88.0, 79.0, 68.0, 65.0, 36.0, 23.0, 36.0, 29.0, 14.0, 8.0, 5.0, 7.0, 5.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395751953125, -0.3832664489746094, -0.37078094482421875, -0.3582954406738281, -0.3458099365234375, -0.3333244323730469, -0.32083892822265625, -0.3083534240722656, -0.295867919921875, -0.2833824157714844, -0.27089691162109375, -0.2584114074707031, -0.2459259033203125, -0.23344039916992188, -0.22095489501953125, -0.20846939086914062, -0.19598388671875, -0.18349838256835938, -0.17101287841796875, -0.15852737426757812, -0.1460418701171875, -0.13355636596679688, -0.12107086181640625, -0.10858535766601562, -0.096099853515625, -0.08361434936523438, -0.07112884521484375, -0.058643341064453125, -0.0461578369140625, -0.033672332763671875, -0.02118682861328125, -0.008701324462890625, 0.0037841796875, 0.016269683837890625, 0.02875518798828125, 0.041240692138671875, 0.0537261962890625, 0.06621170043945312, 0.07869720458984375, 0.09118270874023438, 0.103668212890625, 0.11615371704101562, 0.12863922119140625, 0.14112472534179688, 0.1536102294921875, 0.16609573364257812, 0.17858123779296875, 0.19106674194335938, 0.20355224609375, 0.21603775024414062, 0.22852325439453125, 0.24100875854492188, 0.2534942626953125, 0.2659797668457031, 0.27846527099609375, 0.2909507751464844, 0.303436279296875, 0.3159217834472656, 0.32840728759765625, 0.3408927917480469, 0.3533782958984375, 0.3658638000488281, 0.37834930419921875, 0.3908348083496094, 0.4033203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 3.0, 3.0, 11.0, 15.0, 36.0, 50.0, 61.0, 114.0, 199.0, 493.0, 1254.0, 4833.0, 23698.0, 950106.0, 3172635.0, 31834.0, 6083.0, 1570.0, 594.0, 281.0, 136.0, 91.0, 60.0, 42.0, 25.0, 16.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79150390625, -0.7651748657226562, -0.7388458251953125, -0.7125167846679688, -0.686187744140625, -0.6598587036132812, -0.6335296630859375, -0.6072006225585938, -0.58087158203125, -0.5545425415039062, -0.5282135009765625, -0.5018844604492188, -0.475555419921875, -0.44922637939453125, -0.4228973388671875, -0.39656829833984375, -0.3702392578125, -0.34391021728515625, -0.3175811767578125, -0.29125213623046875, -0.264923095703125, -0.23859405517578125, -0.2122650146484375, -0.18593597412109375, -0.15960693359375, -0.13327789306640625, -0.1069488525390625, -0.08061981201171875, -0.054290771484375, -0.02796173095703125, -0.0016326904296875, 0.02469635009765625, 0.051025390625, 0.07735443115234375, 0.1036834716796875, 0.13001251220703125, 0.156341552734375, 0.18267059326171875, 0.2089996337890625, 0.23532867431640625, 0.26165771484375, 0.28798675537109375, 0.3143157958984375, 0.34064483642578125, 0.366973876953125, 0.39330291748046875, 0.4196319580078125, 0.44596099853515625, 0.4722900390625, 0.49861907958984375, 0.5249481201171875, 0.5512771606445312, 0.577606201171875, 0.6039352416992188, 0.6302642822265625, 0.6565933227539062, 0.68292236328125, 0.7092514038085938, 0.7355804443359375, 0.7619094848632812, 0.788238525390625, 0.8145675659179688, 0.8408966064453125, 0.8672256469726562, 0.8935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 3.0, 11.0, 6.0, 18.0, 37.0, 80.0, 347.0, 2406.0, 825.0, 159.0, 58.0, 31.0, 29.0, 10.0, 20.0, 7.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.8074188232421875, -0.770111083984375, -0.7328033447265625, -0.69549560546875, -0.6581878662109375, -0.620880126953125, -0.5835723876953125, -0.5462646484375, -0.5089569091796875, -0.471649169921875, -0.4343414306640625, -0.39703369140625, -0.3597259521484375, -0.322418212890625, -0.2851104736328125, -0.247802734375, -0.2104949951171875, -0.173187255859375, -0.1358795166015625, -0.09857177734375, -0.0612640380859375, -0.023956298828125, 0.0133514404296875, 0.0506591796875, 0.0879669189453125, 0.125274658203125, 0.1625823974609375, 0.19989013671875, 0.2371978759765625, 0.274505615234375, 0.3118133544921875, 0.34912109375, 0.3864288330078125, 0.423736572265625, 0.4610443115234375, 0.49835205078125, 0.5356597900390625, 0.572967529296875, 0.6102752685546875, 0.6475830078125, 0.6848907470703125, 0.722198486328125, 0.7595062255859375, 0.79681396484375, 0.8341217041015625, 0.871429443359375, 0.9087371826171875, 0.946044921875, 0.9833526611328125, 1.020660400390625, 1.0579681396484375, 1.09527587890625, 1.1325836181640625, 1.169891357421875, 1.2071990966796875, 1.2445068359375, 1.2818145751953125, 1.319122314453125, 1.3564300537109375, 1.39373779296875, 1.4310455322265625, 1.468353271484375, 1.5056610107421875, 1.54296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 10.0, 34.0, 180.0, 446.0, 201.0, 46.0, 28.0, 12.0, 6.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4840898513793945, -7.1733880043029785, -6.8626861572265625, -6.5519843101501465, -6.2412824630737305, -5.930580139160156, -5.61987829208374, -5.309176445007324, -4.998474597930908, -4.687772750854492, -4.377070903778076, -4.06636905670166, -3.755666971206665, -3.444965124130249, -3.134263038635254, -2.823561191558838, -2.512859344482422, -2.202157497406006, -1.8914555311203003, -1.5807535648345947, -1.2700517177581787, -0.9593498706817627, -0.6486479043960571, -0.33794593811035156, -0.027244091033935547, 0.28345781564712524, 0.594159722328186, 0.9048616290092468, 1.2155635356903076, 1.5262653827667236, 1.8369673490524292, 2.1476693153381348, 2.458372116088867, 2.769073963165283, 3.079775810241699, 3.3904778957366943, 3.7011797428131104, 4.0118818283081055, 4.3225836753845215, 4.6332855224609375, 4.9439873695373535, 5.2546892166137695, 5.5653910636901855, 5.876092910766602, 6.186795234680176, 6.497496604919434, 6.808198928833008, 7.118900775909424, 7.42960262298584, 7.740304470062256, 8.051006317138672, 8.361708641052246, 8.672410011291504, 8.983112335205078, 9.293813705444336, 9.60451602935791, 9.915218353271484, 10.225920677185059, 10.536622047424316, 10.84732437133789, 11.158025741577148, 11.468728065490723, 11.77942943572998, 12.090131759643555, 12.400833129882812]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 15.0, 15.0, 16.0, 27.0, 30.0, 40.0, 58.0, 44.0, 46.0, 77.0, 66.0, 64.0, 60.0, 56.0, 64.0, 41.0, 59.0, 50.0, 30.0, 15.0, 20.0, 21.0, 17.0, 20.0, 8.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.888029098510742, -4.734557151794434, -4.581085205078125, -4.427613258361816, -4.274141311645508, -4.120669364929199, -3.9671971797943115, -3.813724994659424, -3.6602530479431152, -3.5067811012268066, -3.353309154510498, -3.1998372077941895, -3.0463650226593018, -2.892893075942993, -2.7394211292266846, -2.585948944091797, -2.4324772357940674, -2.279005289077759, -2.12553334236145, -1.972061276435852, -1.818589210510254, -1.6651172637939453, -1.5116453170776367, -1.3581732511520386, -1.20470130443573, -1.0512293577194214, -0.8977572917938232, -0.7442853450775146, -0.5908133387565613, -0.4373413324356079, -0.2838693857192993, -0.13039731979370117, 0.023074626922607422, 0.1765466183423996, 0.3300186097621918, 0.48349058628082275, 0.6369625926017761, 0.7904345989227295, 0.9439065456390381, 1.0973786115646362, 1.2508505582809448, 1.4043225049972534, 1.5577945709228516, 1.7112665176391602, 1.8647384643554688, 2.0182104110717773, 2.171682357788086, 2.3251545429229736, 2.4786264896392822, 2.632098436355591, 2.7855703830718994, 2.939042568206787, 3.0925145149230957, 3.2459864616394043, 3.399458408355713, 3.5529303550720215, 3.70640230178833, 3.8598742485046387, 4.013346195220947, 4.166818141937256, 4.3202900886535645, 4.473762512207031, 4.62723445892334, 4.780706405639648, 4.934178352355957]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 8.0, 10.0, 14.0, 16.0, 25.0, 37.0, 34.0, 73.0, 87.0, 125.0, 202.0, 318.0, 474.0, 761.0, 1152.0, 1863.0, 3066.0, 5579.0, 10167.0, 20131.0, 43628.0, 105611.0, 262116.0, 329765.0, 147640.0, 59636.0, 26444.0, 12748.0, 6881.0, 3821.0, 2283.0, 1349.0, 839.0, 585.0, 328.0, 232.0, 153.0, 102.0, 70.0, 57.0, 38.0, 14.0, 17.0, 18.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-0.2333984375, -0.22657012939453125, -0.2197418212890625, -0.21291351318359375, -0.206085205078125, -0.19925689697265625, -0.1924285888671875, -0.18560028076171875, -0.17877197265625, -0.17194366455078125, -0.1651153564453125, -0.15828704833984375, -0.151458740234375, -0.14463043212890625, -0.1378021240234375, -0.13097381591796875, -0.1241455078125, -0.11731719970703125, -0.1104888916015625, -0.10366058349609375, -0.096832275390625, -0.09000396728515625, -0.0831756591796875, -0.07634735107421875, -0.06951904296875, -0.06269073486328125, -0.0558624267578125, -0.04903411865234375, -0.042205810546875, -0.03537750244140625, -0.0285491943359375, -0.02172088623046875, -0.014892578125, -0.00806427001953125, -0.0012359619140625, 0.00559234619140625, 0.012420654296875, 0.01924896240234375, 0.0260772705078125, 0.03290557861328125, 0.03973388671875, 0.04656219482421875, 0.0533905029296875, 0.06021881103515625, 0.067047119140625, 0.07387542724609375, 0.0807037353515625, 0.08753204345703125, 0.0943603515625, 0.10118865966796875, 0.1080169677734375, 0.11484527587890625, 0.121673583984375, 0.12850189208984375, 0.1353302001953125, 0.14215850830078125, 0.14898681640625, 0.15581512451171875, 0.1626434326171875, 0.16947174072265625, 0.176300048828125, 0.18312835693359375, 0.1899566650390625, 0.19678497314453125, 0.20361328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 6.0, 10.0, 12.0, 14.0, 18.0, 17.0, 20.0, 30.0, 34.0, 32.0, 44.0, 58.0, 61.0, 64.0, 58.0, 55.0, 66.0, 60.0, 41.0, 56.0, 41.0, 36.0, 35.0, 26.0, 14.0, 14.0, 13.0, 8.0, 9.0, 8.0, 4.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.278839111328125, -0.26959228515625, -0.260345458984375, -0.2510986328125, -0.241851806640625, -0.23260498046875, -0.223358154296875, -0.214111328125, -0.204864501953125, -0.19561767578125, -0.186370849609375, -0.1771240234375, -0.167877197265625, -0.15863037109375, -0.149383544921875, -0.14013671875, -0.130889892578125, -0.12164306640625, -0.112396240234375, -0.1031494140625, -0.093902587890625, -0.08465576171875, -0.075408935546875, -0.066162109375, -0.056915283203125, -0.04766845703125, -0.038421630859375, -0.0291748046875, -0.019927978515625, -0.01068115234375, -0.001434326171875, 0.0078125, 0.017059326171875, 0.02630615234375, 0.035552978515625, 0.0447998046875, 0.054046630859375, 0.06329345703125, 0.072540283203125, 0.081787109375, 0.091033935546875, 0.10028076171875, 0.109527587890625, 0.1187744140625, 0.128021240234375, 0.13726806640625, 0.146514892578125, 0.15576171875, 0.165008544921875, 0.17425537109375, 0.183502197265625, 0.1927490234375, 0.201995849609375, 0.21124267578125, 0.220489501953125, 0.229736328125, 0.238983154296875, 0.24822998046875, 0.257476806640625, 0.2667236328125, 0.275970458984375, 0.28521728515625, 0.294464111328125, 0.3037109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 9.0, 16.0, 25.0, 30.0, 42.0, 65.0, 110.0, 143.0, 267.0, 452.0, 826.0, 2134.0, 10171.0, 252106.0, 757745.0, 19040.0, 3056.0, 987.0, 515.0, 277.0, 160.0, 105.0, 90.0, 58.0, 45.0, 14.0, 16.0, 13.0, 6.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9794921875, -0.946990966796875, -0.91448974609375, -0.881988525390625, -0.8494873046875, -0.816986083984375, -0.78448486328125, -0.751983642578125, -0.719482421875, -0.686981201171875, -0.65447998046875, -0.621978759765625, -0.5894775390625, -0.556976318359375, -0.52447509765625, -0.491973876953125, -0.45947265625, -0.426971435546875, -0.39447021484375, -0.361968994140625, -0.3294677734375, -0.296966552734375, -0.26446533203125, -0.231964111328125, -0.199462890625, -0.166961669921875, -0.13446044921875, -0.101959228515625, -0.0694580078125, -0.036956787109375, -0.00445556640625, 0.028045654296875, 0.060546875, 0.093048095703125, 0.12554931640625, 0.158050537109375, 0.1905517578125, 0.223052978515625, 0.25555419921875, 0.288055419921875, 0.320556640625, 0.353057861328125, 0.38555908203125, 0.418060302734375, 0.4505615234375, 0.483062744140625, 0.51556396484375, 0.548065185546875, 0.58056640625, 0.613067626953125, 0.64556884765625, 0.678070068359375, 0.7105712890625, 0.743072509765625, 0.77557373046875, 0.808074951171875, 0.840576171875, 0.873077392578125, 0.90557861328125, 0.938079833984375, 0.9705810546875, 1.003082275390625, 1.03558349609375, 1.068084716796875, 1.1005859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 7.0, 11.0, 10.0, 17.0, 16.0, 24.0, 42.0, 46.0, 47.0, 69.0, 64.0, 80.0, 69.0, 74.0, 88.0, 55.0, 45.0, 53.0, 49.0, 36.0, 11.0, 30.0, 14.0, 11.0, 6.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -1.9956512451171875, -1.938568115234375, -1.8814849853515625, -1.82440185546875, -1.7673187255859375, -1.710235595703125, -1.6531524658203125, -1.5960693359375, -1.5389862060546875, -1.481903076171875, -1.4248199462890625, -1.36773681640625, -1.3106536865234375, -1.253570556640625, -1.1964874267578125, -1.139404296875, -1.0823211669921875, -1.025238037109375, -0.9681549072265625, -0.91107177734375, -0.8539886474609375, -0.796905517578125, -0.7398223876953125, -0.6827392578125, -0.6256561279296875, -0.568572998046875, -0.5114898681640625, -0.45440673828125, -0.3973236083984375, -0.340240478515625, -0.2831573486328125, -0.22607421875, -0.1689910888671875, -0.111907958984375, -0.0548248291015625, 0.00225830078125, 0.0593414306640625, 0.116424560546875, 0.1735076904296875, 0.2305908203125, 0.2876739501953125, 0.344757080078125, 0.4018402099609375, 0.45892333984375, 0.5160064697265625, 0.573089599609375, 0.6301727294921875, 0.687255859375, 0.7443389892578125, 0.801422119140625, 0.8585052490234375, 0.91558837890625, 0.9726715087890625, 1.029754638671875, 1.0868377685546875, 1.1439208984375, 1.2010040283203125, 1.258087158203125, 1.3151702880859375, 1.37225341796875, 1.4293365478515625, 1.486419677734375, 1.5435028076171875, 1.6005859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 11.0, 10.0, 24.0, 42.0, 74.0, 99.0, 187.0, 422.0, 1192.0, 5295.0, 80168.0, 926413.0, 29718.0, 3313.0, 856.0, 324.0, 148.0, 100.0, 46.0, 30.0, 25.0, 11.0, 10.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4355316162109375, -0.423553466796875, -0.4115753173828125, -0.39959716796875, -0.3876190185546875, -0.375640869140625, -0.3636627197265625, -0.3516845703125, -0.3397064208984375, -0.327728271484375, -0.3157501220703125, -0.30377197265625, -0.2917938232421875, -0.279815673828125, -0.2678375244140625, -0.255859375, -0.2438812255859375, -0.231903076171875, -0.2199249267578125, -0.20794677734375, -0.1959686279296875, -0.183990478515625, -0.1720123291015625, -0.1600341796875, -0.1480560302734375, -0.136077880859375, -0.1240997314453125, -0.11212158203125, -0.1001434326171875, -0.088165283203125, -0.0761871337890625, -0.064208984375, -0.0522308349609375, -0.040252685546875, -0.0282745361328125, -0.01629638671875, -0.0043182373046875, 0.007659912109375, 0.0196380615234375, 0.0316162109375, 0.0435943603515625, 0.055572509765625, 0.0675506591796875, 0.07952880859375, 0.0915069580078125, 0.103485107421875, 0.1154632568359375, 0.12744140625, 0.1394195556640625, 0.151397705078125, 0.1633758544921875, 0.17535400390625, 0.1873321533203125, 0.199310302734375, 0.2112884521484375, 0.2232666015625, 0.2352447509765625, 0.247222900390625, 0.2592010498046875, 0.27117919921875, 0.2831573486328125, 0.295135498046875, 0.3071136474609375, 0.319091796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 0.0, 2.0, 4.0, 8.0, 7.0, 7.0, 8.0, 16.0, 27.0, 19.0, 36.0, 66.0, 108.0, 188.0, 176.0, 114.0, 63.0, 38.0, 25.0, 16.0, 15.0, 17.0, 8.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001633167266845703, -0.00015837885439395905, -0.00015344098210334778, -0.0001485031098127365, -0.00014356523752212524, -0.00013862736523151398, -0.0001336894929409027, -0.00012875162065029144, -0.00012381374835968018, -0.00011887587606906891, -0.00011393800377845764, -0.00010900013148784637, -0.00010406225919723511, -9.912438690662384e-05, -9.418651461601257e-05, -8.92486423254013e-05, -8.431077003479004e-05, -7.937289774417877e-05, -7.44350254535675e-05, -6.949715316295624e-05, -6.455928087234497e-05, -5.9621408581733704e-05, -5.4683536291122437e-05, -4.974566400051117e-05, -4.48077917098999e-05, -3.9869919419288635e-05, -3.493204712867737e-05, -2.99941748380661e-05, -2.5056302547454834e-05, -2.0118430256843567e-05, -1.51805579662323e-05, -1.0242685675621033e-05, -5.304813385009766e-06, -3.6694109439849854e-07, 4.5709311962127686e-06, 9.508803486824036e-06, 1.4446675777435303e-05, 1.938454806804657e-05, 2.4322420358657837e-05, 2.9260292649269104e-05, 3.419816493988037e-05, 3.913603723049164e-05, 4.4073909521102905e-05, 4.901178181171417e-05, 5.394965410232544e-05, 5.8887526392936707e-05, 6.382539868354797e-05, 6.876327097415924e-05, 7.370114326477051e-05, 7.863901555538177e-05, 8.357688784599304e-05, 8.851476013660431e-05, 9.345263242721558e-05, 9.839050471782684e-05, 0.00010332837700843811, 0.00010826624929904938, 0.00011320412158966064, 0.00011814199388027191, 0.00012307986617088318, 0.00012801773846149445, 0.0001329556107521057, 0.00013789348304271698, 0.00014283135533332825, 0.00014776922762393951, 0.00015270709991455078]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 11.0, 10.0, 15.0, 20.0, 33.0, 44.0, 82.0, 128.0, 263.0, 536.0, 1458.0, 6179.0, 72894.0, 906975.0, 52205.0, 5315.0, 1313.0, 486.0, 232.0, 142.0, 90.0, 52.0, 14.0, 23.0, 9.0, 9.0, 5.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.2172260284423828, -0.20605850219726562, -0.19489097595214844, -0.18372344970703125, -0.17255592346191406, -0.16138839721679688, -0.1502208709716797, -0.1390533447265625, -0.1278858184814453, -0.11671829223632812, -0.10555076599121094, -0.09438323974609375, -0.08321571350097656, -0.07204818725585938, -0.06088066101074219, -0.049713134765625, -0.03854560852050781, -0.027378082275390625, -0.016210556030273438, -0.00504302978515625, 0.0061244964599609375, 0.017292022705078125, 0.028459548950195312, 0.0396270751953125, 0.05079460144042969, 0.061962127685546875, 0.07312965393066406, 0.08429718017578125, 0.09546470642089844, 0.10663223266601562, 0.11779975891113281, 0.12896728515625, 0.1401348114013672, 0.15130233764648438, 0.16246986389160156, 0.17363739013671875, 0.18480491638183594, 0.19597244262695312, 0.2071399688720703, 0.2183074951171875, 0.2294750213623047, 0.24064254760742188, 0.25181007385253906, 0.26297760009765625, 0.27414512634277344, 0.2853126525878906, 0.2964801788330078, 0.307647705078125, 0.3188152313232422, 0.3299827575683594, 0.34115028381347656, 0.35231781005859375, 0.36348533630371094, 0.3746528625488281, 0.3858203887939453, 0.3969879150390625, 0.4081554412841797, 0.4193229675292969, 0.43049049377441406, 0.44165802001953125, 0.45282554626464844, 0.4639930725097656, 0.4751605987548828, 0.486328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 8.0, 10.0, 20.0, 23.0, 15.0, 34.0, 51.0, 39.0, 54.0, 68.0, 54.0, 78.0, 64.0, 74.0, 71.0, 54.0, 49.0, 56.0, 32.0, 25.0, 22.0, 9.0, 15.0, 10.0, 8.0, 2.0, 12.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.302734375, -0.29532814025878906, -0.2879219055175781, -0.2805156707763672, -0.27310943603515625, -0.2657032012939453, -0.2582969665527344, -0.25089073181152344, -0.2434844970703125, -0.23607826232910156, -0.22867202758789062, -0.2212657928466797, -0.21385955810546875, -0.2064533233642578, -0.19904708862304688, -0.19164085388183594, -0.184234619140625, -0.17682838439941406, -0.16942214965820312, -0.1620159149169922, -0.15460968017578125, -0.1472034454345703, -0.13979721069335938, -0.13239097595214844, -0.1249847412109375, -0.11757850646972656, -0.11017227172851562, -0.10276603698730469, -0.09535980224609375, -0.08795356750488281, -0.08054733276367188, -0.07314109802246094, -0.06573486328125, -0.05832862854003906, -0.050922393798828125, -0.04351615905761719, -0.03610992431640625, -0.028703689575195312, -0.021297454833984375, -0.013891220092773438, -0.0064849853515625, 0.0009212493896484375, 0.008327484130859375, 0.015733718872070312, 0.02313995361328125, 0.030546188354492188, 0.037952423095703125, 0.04535865783691406, 0.052764892578125, 0.06017112731933594, 0.06757736206054688, 0.07498359680175781, 0.08238983154296875, 0.08979606628417969, 0.09720230102539062, 0.10460853576660156, 0.1120147705078125, 0.11942100524902344, 0.12682723999023438, 0.1342334747314453, 0.14163970947265625, 0.1490459442138672, 0.15645217895507812, 0.16385841369628906, 0.1712646484375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 14.0, 76.0, 560.0, 283.0, 43.0, 19.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1772518157959, -18.717815399169922, -18.258378982543945, -17.79894256591797, -17.33950424194336, -16.880067825317383, -16.420631408691406, -15.96119499206543, -15.501758575439453, -15.042322158813477, -14.5828857421875, -14.123448371887207, -13.66401195526123, -13.204575538635254, -12.745138168334961, -12.285701751708984, -11.826265335083008, -11.366828918457031, -10.907392501831055, -10.447955131530762, -9.988518714904785, -9.529082298278809, -9.069644927978516, -8.610208511352539, -8.150772094726562, -7.691335678100586, -7.231898784637451, -6.772461891174316, -6.31302547454834, -5.853589057922363, -5.3941521644592285, -4.934715270996094, -4.475277900695801, -4.015841484069824, -3.5564045906066895, -3.096967935562134, -2.637531280517578, -2.1780946254730225, -1.7186579704284668, -1.2592213153839111, -0.7997846603393555, -0.3403480052947998, 0.11908864974975586, 0.5785253047943115, 1.0379619598388672, 1.4973986148834229, 1.9568352699279785, 2.416271924972534, 2.87570858001709, 3.3351452350616455, 3.794581890106201, 4.254018783569336, 4.7134552001953125, 5.172891616821289, 5.632328510284424, 6.091765403747559, 6.551201820373535, 7.010638236999512, 7.4700751304626465, 7.929512023925781, 8.388948440551758, 8.848384857177734, 9.307821273803711, 9.767258644104004, 10.22669506072998]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 8.0, 15.0, 9.0, 14.0, 21.0, 31.0, 29.0, 32.0, 52.0, 40.0, 59.0, 67.0, 78.0, 73.0, 65.0, 66.0, 58.0, 48.0, 48.0, 27.0, 29.0, 27.0, 23.0, 20.0, 8.0, 11.0, 10.0, 12.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.539610862731934, -5.338078022003174, -5.136545181274414, -4.935012340545654, -4.7334794998168945, -4.531946182250977, -4.330413341522217, -4.128880500793457, -3.9273476600646973, -3.7258148193359375, -3.5242819786071777, -3.322748899459839, -3.121216058731079, -2.9196832180023193, -2.7181501388549805, -2.5166172981262207, -2.315084457397461, -2.113551616668701, -1.9120186567306519, -1.7104856967926025, -1.5089528560638428, -1.307420015335083, -1.1058870553970337, -0.9043540954589844, -0.7028212547302246, -0.5012883543968201, -0.2997554540634155, -0.09822255373001099, 0.10331034660339355, 0.3048431873321533, 0.5063761472702026, 0.707909107208252, 0.9094424247741699, 1.1109752655029297, 1.312508225440979, 1.5140411853790283, 1.715574026107788, 1.9171068668365479, 2.1186399459838867, 2.3201727867126465, 2.5217056274414062, 2.723238468170166, 2.924771308898926, 3.1263043880462646, 3.3278372287750244, 3.529370069503784, 3.730903148651123, 3.932435989379883, 4.133968830108643, 4.335501670837402, 4.537034511566162, 4.738567352294922, 4.94010066986084, 5.141633033752441, 5.343166351318359, 5.544699192047119, 5.746232032775879, 5.947764873504639, 6.149297714233398, 6.350830554962158, 6.552363395690918, 6.753896713256836, 6.955429553985596, 7.1569623947143555, 7.358495235443115]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 11.0, 10.0, 11.0, 23.0, 10.0, 24.0, 41.0, 62.0, 58.0, 117.0, 292.0, 630.0, 1968.0, 7096.0, 51299.0, 3892196.0, 227285.0, 9238.0, 2112.0, 805.0, 355.0, 194.0, 113.0, 83.0, 53.0, 32.0, 33.0, 21.0, 26.0, 19.0, 12.0, 12.0, 7.0, 3.0, 10.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.66650390625, -0.6467132568359375, -0.626922607421875, -0.6071319580078125, -0.58734130859375, -0.5675506591796875, -0.547760009765625, -0.5279693603515625, -0.5081787109375, -0.4883880615234375, -0.468597412109375, -0.4488067626953125, -0.42901611328125, -0.4092254638671875, -0.389434814453125, -0.3696441650390625, -0.349853515625, -0.3300628662109375, -0.310272216796875, -0.2904815673828125, -0.27069091796875, -0.2509002685546875, -0.231109619140625, -0.2113189697265625, -0.1915283203125, -0.1717376708984375, -0.151947021484375, -0.1321563720703125, -0.11236572265625, -0.0925750732421875, -0.072784423828125, -0.0529937744140625, -0.033203125, -0.0134124755859375, 0.006378173828125, 0.0261688232421875, 0.04595947265625, 0.0657501220703125, 0.085540771484375, 0.1053314208984375, 0.1251220703125, 0.1449127197265625, 0.164703369140625, 0.1844940185546875, 0.20428466796875, 0.2240753173828125, 0.243865966796875, 0.2636566162109375, 0.283447265625, 0.3032379150390625, 0.323028564453125, 0.3428192138671875, 0.36260986328125, 0.3824005126953125, 0.402191162109375, 0.4219818115234375, 0.4417724609375, 0.4615631103515625, 0.481353759765625, 0.5011444091796875, 0.52093505859375, 0.5407257080078125, 0.560516357421875, 0.5803070068359375, 0.60009765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 12.0, 17.0, 23.0, 39.0, 61.0, 81.0, 117.0, 122.0, 135.0, 123.0, 101.0, 66.0, 36.0, 25.0, 16.0, 16.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.2962226867675781, -0.27677154541015625, -0.2573204040527344, -0.2378692626953125, -0.21841812133789062, -0.19896697998046875, -0.17951583862304688, -0.160064697265625, -0.14061355590820312, -0.12116241455078125, -0.10171127319335938, -0.0822601318359375, -0.06280899047851562, -0.04335784912109375, -0.023906707763671875, -0.00445556640625, 0.014995574951171875, 0.03444671630859375, 0.053897857666015625, 0.0733489990234375, 0.09280014038085938, 0.11225128173828125, 0.13170242309570312, 0.151153564453125, 0.17060470581054688, 0.19005584716796875, 0.20950698852539062, 0.2289581298828125, 0.24840927124023438, 0.26786041259765625, 0.2873115539550781, 0.3067626953125, 0.3262138366699219, 0.34566497802734375, 0.3651161193847656, 0.3845672607421875, 0.4040184020996094, 0.42346954345703125, 0.4429206848144531, 0.462371826171875, 0.4818229675292969, 0.5012741088867188, 0.5207252502441406, 0.5401763916015625, 0.5596275329589844, 0.5790786743164062, 0.5985298156738281, 0.61798095703125, 0.6374320983886719, 0.6568832397460938, 0.6763343811035156, 0.6957855224609375, 0.7152366638183594, 0.7346878051757812, 0.7541389465332031, 0.773590087890625, 0.7930412292480469, 0.8124923706054688, 0.8319435119628906, 0.8513946533203125, 0.8708457946777344, 0.8902969360351562, 0.9097480773925781, 0.92919921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 11.0, 23.0, 25.0, 21.0, 37.0, 50.0, 57.0, 148.0, 378.0, 1486.0, 6715.0, 44057.0, 3758659.0, 360516.0, 17612.0, 3059.0, 711.0, 212.0, 120.0, 69.0, 66.0, 60.0, 40.0, 39.0, 34.0, 23.0, 15.0, 12.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.7898025512695312, -0.7671051025390625, -0.7444076538085938, -0.721710205078125, -0.6990127563476562, -0.6763153076171875, -0.6536178588867188, -0.63092041015625, -0.6082229614257812, -0.5855255126953125, -0.5628280639648438, -0.540130615234375, -0.5174331665039062, -0.4947357177734375, -0.47203826904296875, -0.4493408203125, -0.42664337158203125, -0.4039459228515625, -0.38124847412109375, -0.358551025390625, -0.33585357666015625, -0.3131561279296875, -0.29045867919921875, -0.26776123046875, -0.24506378173828125, -0.2223663330078125, -0.19966888427734375, -0.176971435546875, -0.15427398681640625, -0.1315765380859375, -0.10887908935546875, -0.086181640625, -0.06348419189453125, -0.0407867431640625, -0.01808929443359375, 0.004608154296875, 0.02730560302734375, 0.0500030517578125, 0.07270050048828125, 0.09539794921875, 0.11809539794921875, 0.1407928466796875, 0.16349029541015625, 0.186187744140625, 0.20888519287109375, 0.2315826416015625, 0.25428009033203125, 0.2769775390625, 0.29967498779296875, 0.3223724365234375, 0.34506988525390625, 0.367767333984375, 0.39046478271484375, 0.4131622314453125, 0.43585968017578125, 0.45855712890625, 0.48125457763671875, 0.5039520263671875, 0.5266494750976562, 0.549346923828125, 0.5720443725585938, 0.5947418212890625, 0.6174392700195312, 0.64013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 7.0, 14.0, 20.0, 22.0, 42.0, 96.0, 457.0, 2268.0, 883.0, 150.0, 46.0, 29.0, 15.0, 11.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.493896484375, -0.4601020812988281, -0.42630767822265625, -0.3925132751464844, -0.3587188720703125, -0.3249244689941406, -0.29113006591796875, -0.2573356628417969, -0.223541259765625, -0.18974685668945312, -0.15595245361328125, -0.12215805053710938, -0.0883636474609375, -0.054569244384765625, -0.02077484130859375, 0.013019561767578125, 0.04681396484375, 0.08060836791992188, 0.11440277099609375, 0.14819717407226562, 0.1819915771484375, 0.21578598022460938, 0.24958038330078125, 0.2833747863769531, 0.317169189453125, 0.3509635925292969, 0.38475799560546875, 0.4185523986816406, 0.4523468017578125, 0.4861412048339844, 0.5199356079101562, 0.5537300109863281, 0.5875244140625, 0.6213188171386719, 0.6551132202148438, 0.6889076232910156, 0.7227020263671875, 0.7564964294433594, 0.7902908325195312, 0.8240852355957031, 0.857879638671875, 0.8916740417480469, 0.9254684448242188, 0.9592628479003906, 0.9930572509765625, 1.0268516540527344, 1.0606460571289062, 1.0944404602050781, 1.12823486328125, 1.1620292663574219, 1.1958236694335938, 1.2296180725097656, 1.2634124755859375, 1.2972068786621094, 1.3310012817382812, 1.3647956848144531, 1.398590087890625, 1.4323844909667969, 1.4661788940429688, 1.4999732971191406, 1.5337677001953125, 1.5675621032714844, 1.6013565063476562, 1.6351509094238281, 1.6689453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 27.0, 85.0, 331.0, 327.0, 118.0, 51.0, 21.0, 4.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.815892219543457, -4.636350154876709, -4.456808090209961, -4.277266025543213, -4.097723960876465, -3.918181896209717, -3.7386395931243896, -3.5590975284576416, -3.3795554637908936, -3.2000133991241455, -3.0204713344573975, -2.8409290313720703, -2.6613869667053223, -2.481844902038574, -2.302302837371826, -2.122760772705078, -1.94321870803833, -1.763676643371582, -1.584134578704834, -1.4045923948287964, -1.2250503301620483, -1.0455082654953003, -0.8659660816192627, -0.6864240169525146, -0.5068819522857666, -0.32733985781669617, -0.14779776334762573, 0.03174436092376709, 0.21128642559051514, 0.3908284902572632, 0.5703706741333008, 0.7499127388000488, 0.9294543266296387, 1.1089963912963867, 1.2885384559631348, 1.4680806398391724, 1.6476227045059204, 1.8271647691726685, 2.006706953048706, 2.186249017715454, 2.365791082382202, 2.54533314704895, 2.7248752117156982, 2.9044175148010254, 3.0839595794677734, 3.2635016441345215, 3.4430437088012695, 3.6225857734680176, 3.8021278381347656, 3.9816699028015137, 4.161211967468262, 4.34075403213501, 4.520296096801758, 4.699838161468506, 4.879380226135254, 5.05892276763916, 5.23846435546875, 5.418006420135498, 5.597548484802246, 5.777090549468994, 5.956632614135742, 6.13617467880249, 6.315716743469238, 6.4952592849731445, 6.674801349639893]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 4.0, 6.0, 12.0, 15.0, 22.0, 35.0, 44.0, 47.0, 56.0, 73.0, 69.0, 97.0, 80.0, 60.0, 70.0, 79.0, 45.0, 54.0, 41.0, 25.0, 24.0, 8.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6425580978393555, -4.530004501342773, -4.417450904846191, -4.304897308349609, -4.192343711853027, -4.079790115356445, -3.967236280441284, -3.854682683944702, -3.74212908744812, -3.629575490951538, -3.517021894454956, -3.404468297958374, -3.291914463043213, -3.179360866546631, -3.066807270050049, -2.954253673553467, -2.8417000770568848, -2.7291464805603027, -2.6165928840637207, -2.5040392875671387, -2.3914856910705566, -2.2789320945739746, -2.1663782596588135, -2.0538246631622314, -1.9412710666656494, -1.8287174701690674, -1.7161638736724854, -1.6036101579666138, -1.4910565614700317, -1.3785029649734497, -1.2659492492675781, -1.153395652770996, -1.040842056274414, -0.928288459777832, -0.8157348036766052, -0.7031811475753784, -0.5906275510787964, -0.47807395458221436, -0.36552029848098755, -0.25296664237976074, -0.1404130458831787, -0.027859419584274292, 0.08469420671463013, 0.19724783301353455, 0.30980145931243896, 0.422355055809021, 0.5349087119102478, 0.6474623680114746, 0.7600159645080566, 0.8725695610046387, 0.9851232171058655, 1.0976768732070923, 1.2102304697036743, 1.3227840662002563, 1.435337781906128, 1.54789137840271, 1.660444974899292, 1.772998571395874, 1.885552167892456, 1.9981058835983276, 2.110659599304199, 2.2232131958007812, 2.3357667922973633, 2.4483203887939453, 2.5608739852905273]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 11.0, 17.0, 42.0, 36.0, 76.0, 107.0, 162.0, 304.0, 520.0, 1042.0, 2210.0, 5132.0, 14156.0, 47593.0, 202681.0, 527691.0, 181051.0, 43377.0, 13136.0, 4888.0, 2047.0, 997.0, 498.0, 313.0, 168.0, 95.0, 52.0, 45.0, 38.0, 15.0, 13.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.385986328125, -0.374786376953125, -0.36358642578125, -0.352386474609375, -0.3411865234375, -0.329986572265625, -0.31878662109375, -0.307586669921875, -0.29638671875, -0.285186767578125, -0.27398681640625, -0.262786865234375, -0.2515869140625, -0.240386962890625, -0.22918701171875, -0.217987060546875, -0.206787109375, -0.195587158203125, -0.18438720703125, -0.173187255859375, -0.1619873046875, -0.150787353515625, -0.13958740234375, -0.128387451171875, -0.1171875, -0.105987548828125, -0.09478759765625, -0.083587646484375, -0.0723876953125, -0.061187744140625, -0.04998779296875, -0.038787841796875, -0.027587890625, -0.016387939453125, -0.00518798828125, 0.006011962890625, 0.0172119140625, 0.028411865234375, 0.03961181640625, 0.050811767578125, 0.06201171875, 0.073211669921875, 0.08441162109375, 0.095611572265625, 0.1068115234375, 0.118011474609375, 0.12921142578125, 0.140411376953125, 0.151611328125, 0.162811279296875, 0.17401123046875, 0.185211181640625, 0.1964111328125, 0.207611083984375, 0.21881103515625, 0.230010986328125, 0.2412109375, 0.252410888671875, 0.26361083984375, 0.274810791015625, 0.2860107421875, 0.297210693359375, 0.30841064453125, 0.319610595703125, 0.330810546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 16.0, 10.0, 13.0, 16.0, 20.0, 39.0, 41.0, 37.0, 54.0, 50.0, 67.0, 80.0, 81.0, 73.0, 62.0, 52.0, 65.0, 42.0, 51.0, 28.0, 30.0, 14.0, 14.0, 6.0, 10.0, 10.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28662109375, -0.27581787109375, -0.2650146484375, -0.25421142578125, -0.243408203125, -0.23260498046875, -0.2218017578125, -0.21099853515625, -0.2001953125, -0.18939208984375, -0.1785888671875, -0.16778564453125, -0.156982421875, -0.14617919921875, -0.1353759765625, -0.12457275390625, -0.11376953125, -0.10296630859375, -0.0921630859375, -0.08135986328125, -0.070556640625, -0.05975341796875, -0.0489501953125, -0.03814697265625, -0.02734375, -0.01654052734375, -0.0057373046875, 0.00506591796875, 0.015869140625, 0.02667236328125, 0.0374755859375, 0.04827880859375, 0.05908203125, 0.06988525390625, 0.0806884765625, 0.09149169921875, 0.102294921875, 0.11309814453125, 0.1239013671875, 0.13470458984375, 0.1455078125, 0.15631103515625, 0.1671142578125, 0.17791748046875, 0.188720703125, 0.19952392578125, 0.2103271484375, 0.22113037109375, 0.23193359375, 0.24273681640625, 0.2535400390625, 0.26434326171875, 0.275146484375, 0.28594970703125, 0.2967529296875, 0.30755615234375, 0.318359375, 0.32916259765625, 0.3399658203125, 0.35076904296875, 0.361572265625, 0.37237548828125, 0.3831787109375, 0.39398193359375, 0.40478515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 7.0, 12.0, 32.0, 40.0, 71.0, 171.0, 346.0, 1009.0, 4090.0, 196917.0, 836352.0, 7293.0, 1322.0, 472.0, 197.0, 92.0, 40.0, 30.0, 9.0, 13.0, 6.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.63671875, -1.5887603759765625, -1.540802001953125, -1.4928436279296875, -1.44488525390625, -1.3969268798828125, -1.348968505859375, -1.3010101318359375, -1.2530517578125, -1.2050933837890625, -1.157135009765625, -1.1091766357421875, -1.06121826171875, -1.0132598876953125, -0.965301513671875, -0.9173431396484375, -0.869384765625, -0.8214263916015625, -0.773468017578125, -0.7255096435546875, -0.67755126953125, -0.6295928955078125, -0.581634521484375, -0.5336761474609375, -0.4857177734375, -0.4377593994140625, -0.389801025390625, -0.3418426513671875, -0.29388427734375, -0.2459259033203125, -0.197967529296875, -0.1500091552734375, -0.10205078125, -0.0540924072265625, -0.006134033203125, 0.0418243408203125, 0.08978271484375, 0.1377410888671875, 0.185699462890625, 0.2336578369140625, 0.2816162109375, 0.3295745849609375, 0.377532958984375, 0.4254913330078125, 0.47344970703125, 0.5214080810546875, 0.569366455078125, 0.6173248291015625, 0.665283203125, 0.7132415771484375, 0.761199951171875, 0.8091583251953125, 0.85711669921875, 0.9050750732421875, 0.953033447265625, 1.0009918212890625, 1.0489501953125, 1.0969085693359375, 1.144866943359375, 1.1928253173828125, 1.24078369140625, 1.2887420654296875, 1.336700439453125, 1.3846588134765625, 1.4326171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 18.0, 30.0, 45.0, 93.0, 122.0, 126.0, 144.0, 143.0, 101.0, 70.0, 48.0, 27.0, 18.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.283203125, -3.1998291015625, -3.116455078125, -3.0330810546875, -2.94970703125, -2.8663330078125, -2.782958984375, -2.6995849609375, -2.6162109375, -2.5328369140625, -2.449462890625, -2.3660888671875, -2.28271484375, -2.1993408203125, -2.115966796875, -2.0325927734375, -1.94921875, -1.8658447265625, -1.782470703125, -1.6990966796875, -1.61572265625, -1.5323486328125, -1.448974609375, -1.3656005859375, -1.2822265625, -1.1988525390625, -1.115478515625, -1.0321044921875, -0.94873046875, -0.8653564453125, -0.781982421875, -0.6986083984375, -0.615234375, -0.5318603515625, -0.448486328125, -0.3651123046875, -0.28173828125, -0.1983642578125, -0.114990234375, -0.0316162109375, 0.0517578125, 0.1351318359375, 0.218505859375, 0.3018798828125, 0.38525390625, 0.4686279296875, 0.552001953125, 0.6353759765625, 0.71875, 0.8021240234375, 0.885498046875, 0.9688720703125, 1.05224609375, 1.1356201171875, 1.218994140625, 1.3023681640625, 1.3857421875, 1.4691162109375, 1.552490234375, 1.6358642578125, 1.71923828125, 1.8026123046875, 1.885986328125, 1.9693603515625, 2.052734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 8.0, 8.0, 7.0, 13.0, 23.0, 25.0, 39.0, 72.0, 129.0, 309.0, 1311.0, 16288.0, 989643.0, 37973.0, 1907.0, 409.0, 166.0, 82.0, 41.0, 35.0, 17.0, 9.0, 11.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47021484375, -0.45377349853515625, -0.4373321533203125, -0.42089080810546875, -0.404449462890625, -0.38800811767578125, -0.3715667724609375, -0.35512542724609375, -0.33868408203125, -0.32224273681640625, -0.3058013916015625, -0.28936004638671875, -0.272918701171875, -0.25647735595703125, -0.2400360107421875, -0.22359466552734375, -0.2071533203125, -0.19071197509765625, -0.1742706298828125, -0.15782928466796875, -0.141387939453125, -0.12494659423828125, -0.1085052490234375, -0.09206390380859375, -0.07562255859375, -0.05918121337890625, -0.0427398681640625, -0.02629852294921875, -0.009857177734375, 0.00658416748046875, 0.0230255126953125, 0.03946685791015625, 0.055908203125, 0.07234954833984375, 0.0887908935546875, 0.10523223876953125, 0.121673583984375, 0.13811492919921875, 0.1545562744140625, 0.17099761962890625, 0.18743896484375, 0.20388031005859375, 0.2203216552734375, 0.23676300048828125, 0.253204345703125, 0.26964569091796875, 0.2860870361328125, 0.30252838134765625, 0.3189697265625, 0.33541107177734375, 0.3518524169921875, 0.36829376220703125, 0.384735107421875, 0.40117645263671875, 0.4176177978515625, 0.43405914306640625, 0.45050048828125, 0.46694183349609375, 0.4833831787109375, 0.49982452392578125, 0.516265869140625, 0.5327072143554688, 0.5491485595703125, 0.5655899047851562, 0.58203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 6.0, 4.0, 5.0, 3.0, 5.0, 2.0, 6.0, 7.0, 11.0, 8.0, 9.0, 20.0, 27.0, 27.0, 49.0, 98.0, 122.0, 173.0, 140.0, 99.0, 50.0, 37.0, 16.0, 15.0, 15.0, 8.0, 8.0, 9.0, 2.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.423494338989258e-05, -9.103305637836456e-05, -8.783116936683655e-05, -8.462928235530853e-05, -8.142739534378052e-05, -7.82255083322525e-05, -7.502362132072449e-05, -7.182173430919647e-05, -6.861984729766846e-05, -6.541796028614044e-05, -6.221607327461243e-05, -5.901418626308441e-05, -5.5812299251556396e-05, -5.261041224002838e-05, -4.9408525228500366e-05, -4.620663821697235e-05, -4.3004751205444336e-05, -3.980286419391632e-05, -3.6600977182388306e-05, -3.339909017086029e-05, -3.0197203159332275e-05, -2.699531614780426e-05, -2.3793429136276245e-05, -2.059154212474823e-05, -1.7389655113220215e-05, -1.41877681016922e-05, -1.0985881090164185e-05, -7.78399407863617e-06, -4.582107067108154e-06, -1.3802200555801392e-06, 1.821666955947876e-06, 5.023553967475891e-06, 8.225440979003906e-06, 1.1427327990531921e-05, 1.4629215002059937e-05, 1.783110201358795e-05, 2.1032989025115967e-05, 2.4234876036643982e-05, 2.7436763048171997e-05, 3.063865005970001e-05, 3.384053707122803e-05, 3.704242408275604e-05, 4.024431109428406e-05, 4.344619810581207e-05, 4.664808511734009e-05, 4.98499721288681e-05, 5.305185914039612e-05, 5.625374615192413e-05, 5.945563316345215e-05, 6.265752017498016e-05, 6.585940718650818e-05, 6.90612941980362e-05, 7.226318120956421e-05, 7.546506822109222e-05, 7.866695523262024e-05, 8.186884224414825e-05, 8.507072925567627e-05, 8.827261626720428e-05, 9.14745032787323e-05, 9.467639029026031e-05, 9.787827730178833e-05, 0.00010108016431331635, 0.00010428205132484436, 0.00010748393833637238, 0.00011068582534790039]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 18.0, 19.0, 23.0, 35.0, 54.0, 84.0, 158.0, 310.0, 699.0, 1984.0, 10839.0, 240039.0, 766955.0, 22399.0, 3153.0, 899.0, 392.0, 180.0, 117.0, 73.0, 41.0, 21.0, 17.0, 12.0, 12.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2479248046875, -0.2380695343017578, -0.22821426391601562, -0.21835899353027344, -0.20850372314453125, -0.19864845275878906, -0.18879318237304688, -0.1789379119873047, -0.1690826416015625, -0.1592273712158203, -0.14937210083007812, -0.13951683044433594, -0.12966156005859375, -0.11980628967285156, -0.10995101928710938, -0.10009574890136719, -0.090240478515625, -0.08038520812988281, -0.07052993774414062, -0.06067466735839844, -0.05081939697265625, -0.04096412658691406, -0.031108856201171875, -0.021253585815429688, -0.0113983154296875, -0.0015430450439453125, 0.008312225341796875, 0.018167495727539062, 0.02802276611328125, 0.03787803649902344, 0.047733306884765625, 0.05758857727050781, 0.06744384765625, 0.07729911804199219, 0.08715438842773438, 0.09700965881347656, 0.10686492919921875, 0.11672019958496094, 0.12657546997070312, 0.1364307403564453, 0.1462860107421875, 0.1561412811279297, 0.16599655151367188, 0.17585182189941406, 0.18570709228515625, 0.19556236267089844, 0.20541763305664062, 0.2152729034423828, 0.225128173828125, 0.2349834442138672, 0.24483871459960938, 0.25469398498535156, 0.26454925537109375, 0.27440452575683594, 0.2842597961425781, 0.2941150665283203, 0.3039703369140625, 0.3138256072998047, 0.3236808776855469, 0.33353614807128906, 0.34339141845703125, 0.35324668884277344, 0.3631019592285156, 0.3729572296142578, 0.3828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 2.0, 0.0, 4.0, 7.0, 6.0, 2.0, 7.0, 8.0, 16.0, 13.0, 23.0, 20.0, 31.0, 41.0, 61.0, 53.0, 70.0, 81.0, 110.0, 81.0, 75.0, 77.0, 54.0, 30.0, 24.0, 22.0, 21.0, 18.0, 7.0, 10.0, 2.0, 2.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2054443359375, -0.1993122100830078, -0.19318008422851562, -0.18704795837402344, -0.18091583251953125, -0.17478370666503906, -0.16865158081054688, -0.1625194549560547, -0.1563873291015625, -0.1502552032470703, -0.14412307739257812, -0.13799095153808594, -0.13185882568359375, -0.12572669982910156, -0.11959457397460938, -0.11346244812011719, -0.107330322265625, -0.10119819641113281, -0.09506607055664062, -0.08893394470214844, -0.08280181884765625, -0.07666969299316406, -0.07053756713867188, -0.06440544128417969, -0.0582733154296875, -0.05214118957519531, -0.046009063720703125, -0.03987693786621094, -0.03374481201171875, -0.027612686157226562, -0.021480560302734375, -0.015348434448242188, -0.00921630859375, -0.0030841827392578125, 0.003047943115234375, 0.009180068969726562, 0.01531219482421875, 0.021444320678710938, 0.027576446533203125, 0.03370857238769531, 0.0398406982421875, 0.04597282409667969, 0.052104949951171875, 0.05823707580566406, 0.06436920166015625, 0.07050132751464844, 0.07663345336914062, 0.08276557922363281, 0.088897705078125, 0.09502983093261719, 0.10116195678710938, 0.10729408264160156, 0.11342620849609375, 0.11955833435058594, 0.12569046020507812, 0.1318225860595703, 0.1379547119140625, 0.1440868377685547, 0.15021896362304688, 0.15635108947753906, 0.16248321533203125, 0.16861534118652344, 0.17474746704101562, 0.1808795928955078, 0.18701171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 10.0, 5.0, 13.0, 122.0, 668.0, 156.0, 21.0, 9.0, 1.0, 2.0, 1.0, 2.0], "bins": [-26.998016357421875, -26.521320343017578, -26.04462242126465, -25.56792640686035, -25.091230392456055, -24.614534378051758, -24.137836456298828, -23.66114044189453, -23.184444427490234, -22.707748413085938, -22.231050491333008, -21.75435447692871, -21.277658462524414, -20.800962448120117, -20.324264526367188, -19.84756851196289, -19.370872497558594, -18.894176483154297, -18.417478561401367, -17.94078254699707, -17.464086532592773, -16.987390518188477, -16.510692596435547, -16.03399658203125, -15.55729866027832, -15.080601692199707, -14.60390567779541, -14.127208709716797, -13.6505126953125, -13.173815727233887, -12.697118759155273, -12.220422744750977, -11.743725776672363, -11.26702880859375, -10.790332794189453, -10.31363582611084, -9.836939811706543, -9.36024284362793, -8.883546829223633, -8.40684986114502, -7.9301533699035645, -7.453456878662109, -6.976760387420654, -6.500063896179199, -6.023366928100586, -5.546670913696289, -5.069973945617676, -4.593277454376221, -4.116580963134766, -3.6398844718933105, -3.1631879806518555, -2.6864912509918213, -2.209794759750366, -1.7330982685089111, -1.256401538848877, -0.7797050476074219, -0.3030085563659668, 0.17368799448013306, 0.6503845453262329, 1.1270811557769775, 1.6037776470184326, 2.0804741382598877, 2.557170867919922, 3.033867359161377, 3.510563850402832]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 21.0, 25.0, 26.0, 39.0, 67.0, 70.0, 77.0, 98.0, 119.0, 105.0, 71.0, 62.0, 56.0, 43.0, 36.0, 27.0, 14.0, 13.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.415787696838379, -7.1360368728637695, -6.856285572052002, -6.576534748077393, -6.296783447265625, -6.017032623291016, -5.737281799316406, -5.457530498504639, -5.177779197692871, -4.898028373718262, -4.618277072906494, -4.338526248931885, -4.058774948120117, -3.779024124145508, -3.4992730617523193, -3.219521999359131, -2.9397711753845215, -2.660020112991333, -2.3802690505981445, -2.100518226623535, -1.8207670450210571, -1.5410159826278687, -1.2612650394439697, -0.9815139770507812, -0.7017629146575928, -0.4220118820667267, -0.1422608494758606, 0.1374901533126831, 0.4172412157058716, 0.6969922780990601, 0.976743221282959, 1.2564942836761475, 1.536245346069336, 1.8159964084625244, 2.095747470855713, 2.3754982948303223, 2.65524959564209, 2.935000419616699, 3.2147514820098877, 3.494502544403076, 3.7742536067962646, 4.054004669189453, 4.3337554931640625, 4.61350679397583, 4.8932576179504395, 5.173008918762207, 5.452759742736816, 5.732510566711426, 6.012261867523193, 6.292012691497803, 6.57176399230957, 6.85151481628418, 7.131266117095947, 7.411016941070557, 7.690768241882324, 7.970519065856934, 8.250269889831543, 8.530020713806152, 8.809771537780762, 9.089523315429688, 9.369274139404297, 9.649024963378906, 9.928775787353516, 10.208526611328125, 10.48827838897705]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 24.0, 28.0, 36.0, 51.0, 99.0, 166.0, 275.0, 457.0, 849.0, 1675.0, 3999.0, 10788.0, 41336.0, 343174.0, 2739414.0, 942847.0, 83579.0, 15686.0, 5074.0, 2144.0, 1051.0, 571.0, 336.0, 212.0, 136.0, 82.0, 61.0, 34.0, 25.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.192169189453125, -0.18438720703125, -0.176605224609375, -0.1688232421875, -0.161041259765625, -0.15325927734375, -0.145477294921875, -0.1376953125, -0.129913330078125, -0.12213134765625, -0.114349365234375, -0.1065673828125, -0.098785400390625, -0.09100341796875, -0.083221435546875, -0.075439453125, -0.067657470703125, -0.05987548828125, -0.052093505859375, -0.0443115234375, -0.036529541015625, -0.02874755859375, -0.020965576171875, -0.01318359375, -0.005401611328125, 0.00238037109375, 0.010162353515625, 0.0179443359375, 0.025726318359375, 0.03350830078125, 0.041290283203125, 0.049072265625, 0.056854248046875, 0.06463623046875, 0.072418212890625, 0.0802001953125, 0.087982177734375, 0.09576416015625, 0.103546142578125, 0.111328125, 0.119110107421875, 0.12689208984375, 0.134674072265625, 0.1424560546875, 0.150238037109375, 0.15802001953125, 0.165802001953125, 0.173583984375, 0.181365966796875, 0.18914794921875, 0.196929931640625, 0.2047119140625, 0.212493896484375, 0.22027587890625, 0.228057861328125, 0.23583984375, 0.243621826171875, 0.25140380859375, 0.259185791015625, 0.2669677734375, 0.274749755859375, 0.28253173828125, 0.290313720703125, 0.298095703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 10.0, 6.0, 16.0, 16.0, 17.0, 17.0, 40.0, 45.0, 43.0, 42.0, 49.0, 50.0, 66.0, 55.0, 68.0, 53.0, 66.0, 58.0, 53.0, 45.0, 31.0, 40.0, 38.0, 20.0, 15.0, 6.0, 8.0, 9.0, 6.0, 6.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.23091697692871094, -0.22245407104492188, -0.2139911651611328, -0.20552825927734375, -0.1970653533935547, -0.18860244750976562, -0.18013954162597656, -0.1716766357421875, -0.16321372985839844, -0.15475082397460938, -0.1462879180908203, -0.13782501220703125, -0.1293621063232422, -0.12089920043945312, -0.11243629455566406, -0.103973388671875, -0.09551048278808594, -0.08704757690429688, -0.07858467102050781, -0.07012176513671875, -0.06165885925292969, -0.053195953369140625, -0.04473304748535156, -0.0362701416015625, -0.027807235717773438, -0.019344329833984375, -0.010881423950195312, -0.00241851806640625, 0.0060443878173828125, 0.014507293701171875, 0.022970199584960938, 0.03143310546875, 0.03989601135253906, 0.048358917236328125, 0.05682182312011719, 0.06528472900390625, 0.07374763488769531, 0.08221054077148438, 0.09067344665527344, 0.0991363525390625, 0.10759925842285156, 0.11606216430664062, 0.12452507019042969, 0.13298797607421875, 0.1414508819580078, 0.14991378784179688, 0.15837669372558594, 0.166839599609375, 0.17530250549316406, 0.18376541137695312, 0.1922283172607422, 0.20069122314453125, 0.2091541290283203, 0.21761703491210938, 0.22607994079589844, 0.2345428466796875, 0.24300575256347656, 0.2514686584472656, 0.2599315643310547, 0.26839447021484375, 0.2768573760986328, 0.2853202819824219, 0.29378318786621094, 0.30224609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 6.0, 10.0, 6.0, 17.0, 25.0, 30.0, 51.0, 61.0, 120.0, 189.0, 306.0, 642.0, 1488.0, 3878.0, 13195.0, 61977.0, 902355.0, 3074858.0, 107887.0, 18558.0, 5176.0, 1772.0, 780.0, 376.0, 181.0, 97.0, 67.0, 51.0, 28.0, 24.0, 22.0, 14.0, 12.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3577728271484375, -0.346649169921875, -0.3355255126953125, -0.32440185546875, -0.3132781982421875, -0.302154541015625, -0.2910308837890625, -0.2799072265625, -0.2687835693359375, -0.257659912109375, -0.2465362548828125, -0.23541259765625, -0.2242889404296875, -0.213165283203125, -0.2020416259765625, -0.19091796875, -0.1797943115234375, -0.168670654296875, -0.1575469970703125, -0.14642333984375, -0.1352996826171875, -0.124176025390625, -0.1130523681640625, -0.1019287109375, -0.0908050537109375, -0.079681396484375, -0.0685577392578125, -0.05743408203125, -0.0463104248046875, -0.035186767578125, -0.0240631103515625, -0.012939453125, -0.0018157958984375, 0.009307861328125, 0.0204315185546875, 0.03155517578125, 0.0426788330078125, 0.053802490234375, 0.0649261474609375, 0.0760498046875, 0.0871734619140625, 0.098297119140625, 0.1094207763671875, 0.12054443359375, 0.1316680908203125, 0.142791748046875, 0.1539154052734375, 0.1650390625, 0.1761627197265625, 0.187286376953125, 0.1984100341796875, 0.20953369140625, 0.2206573486328125, 0.231781005859375, 0.2429046630859375, 0.2540283203125, 0.2651519775390625, 0.276275634765625, 0.2873992919921875, 0.29852294921875, 0.3096466064453125, 0.320770263671875, 0.3318939208984375, 0.343017578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 7.0, 12.0, 16.0, 19.0, 23.0, 45.0, 42.0, 80.0, 139.0, 300.0, 676.0, 1110.0, 872.0, 353.0, 141.0, 88.0, 40.0, 25.0, 21.0, 14.0, 11.0, 6.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5779876708984375, -0.561248779296875, -0.5445098876953125, -0.52777099609375, -0.5110321044921875, -0.494293212890625, -0.4775543212890625, -0.4608154296875, -0.4440765380859375, -0.427337646484375, -0.4105987548828125, -0.39385986328125, -0.3771209716796875, -0.360382080078125, -0.3436431884765625, -0.326904296875, -0.3101654052734375, -0.293426513671875, -0.2766876220703125, -0.25994873046875, -0.2432098388671875, -0.226470947265625, -0.2097320556640625, -0.1929931640625, -0.1762542724609375, -0.159515380859375, -0.1427764892578125, -0.12603759765625, -0.1092987060546875, -0.092559814453125, -0.0758209228515625, -0.05908203125, -0.0423431396484375, -0.025604248046875, -0.0088653564453125, 0.00787353515625, 0.0246124267578125, 0.041351318359375, 0.0580902099609375, 0.0748291015625, 0.0915679931640625, 0.108306884765625, 0.1250457763671875, 0.14178466796875, 0.1585235595703125, 0.175262451171875, 0.1920013427734375, 0.208740234375, 0.2254791259765625, 0.242218017578125, 0.2589569091796875, 0.27569580078125, 0.2924346923828125, 0.309173583984375, 0.3259124755859375, 0.3426513671875, 0.3593902587890625, 0.376129150390625, 0.3928680419921875, 0.40960693359375, 0.4263458251953125, 0.443084716796875, 0.4598236083984375, 0.4765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 51.0, 413.0, 455.0, 43.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.742006301879883, -6.437751293182373, -6.133496284484863, -5.829241752624512, -5.524986743927002, -5.220731735229492, -4.916477203369141, -4.612222194671631, -4.307967185974121, -4.003712177276611, -3.6994574069976807, -3.39520263671875, -3.0909476280212402, -2.7866926193237305, -2.4824378490448, -2.178183078765869, -1.8739280700683594, -1.5696731805801392, -1.265418291091919, -0.9611634016036987, -0.6569085121154785, -0.3526536226272583, -0.048398733139038086, 0.2558560371398926, 0.5601110458374023, 0.8643659353256226, 1.1686208248138428, 1.472875714302063, 1.7771306037902832, 2.081385612487793, 2.3856403827667236, 2.6898951530456543, 2.994150161743164, 3.298405170440674, 3.6026599407196045, 3.906914710998535, 4.211169719696045, 4.515424728393555, 4.819679260253906, 5.123934268951416, 5.428189277648926, 5.7324442863464355, 6.036699295043945, 6.340953826904297, 6.645208835601807, 6.949463844299316, 7.253718376159668, 7.557973384857178, 7.8622283935546875, 8.166482925415039, 8.470738410949707, 8.774992942810059, 9.079248428344727, 9.383502960205078, 9.68775749206543, 9.992012023925781, 10.29626750946045, 10.6005220413208, 10.904777526855469, 11.20903205871582, 11.513286590576172, 11.81754207611084, 12.121796607971191, 12.42605209350586, 12.730306625366211]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 9.0, 15.0, 16.0, 19.0, 23.0, 22.0, 26.0, 49.0, 42.0, 48.0, 47.0, 55.0, 68.0, 63.0, 63.0, 53.0, 53.0, 48.0, 39.0, 29.0, 33.0, 33.0, 22.0, 14.0, 23.0, 22.0, 11.0, 12.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.8203125, -2.743502140045166, -2.666692018508911, -2.589881658554077, -2.513071298599243, -2.4362611770629883, -2.3594508171081543, -2.2826404571533203, -2.2058303356170654, -2.1290199756622314, -2.0522098541259766, -1.9753994941711426, -1.8985892534255981, -1.8217790126800537, -1.7449686527252197, -1.6681584119796753, -1.5913480520248413, -1.5145378112792969, -1.437727451324463, -1.3609172105789185, -1.284106969833374, -1.20729660987854, -1.1304863691329956, -1.0536761283874512, -0.976865828037262, -0.9000555276870728, -0.8232452869415283, -0.7464349865913391, -0.6696246862411499, -0.5928144454956055, -0.5160041451454163, -0.4391939043998718, -0.3623836040496826, -0.2855733335018158, -0.20876304805278778, -0.13195276260375977, -0.055142492055892944, 0.021667778491973877, 0.09847807884216309, 0.17528831958770752, 0.25209861993789673, 0.32890889048576355, 0.40571916103363037, 0.4825294613838196, 0.5593397617340088, 0.6361500024795532, 0.7129603028297424, 0.7897705435752869, 0.8665808439254761, 0.9433911442756653, 1.0202014446258545, 1.097011685371399, 1.1738219261169434, 1.2506322860717773, 1.3274425268173218, 1.4042527675628662, 1.4810631275177002, 1.5578733682632446, 1.6346837282180786, 1.711493968963623, 1.7883042097091675, 1.865114450454712, 1.941924810409546, 2.018734931945801, 2.0955452919006348]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 9.0, 23.0, 28.0, 49.0, 63.0, 122.0, 251.0, 576.0, 1128.0, 2526.0, 6484.0, 18139.0, 60105.0, 212759.0, 434005.0, 219133.0, 62594.0, 18981.0, 6649.0, 2644.0, 1138.0, 538.0, 264.0, 150.0, 83.0, 35.0, 30.0, 17.0, 13.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.279296875, -0.2720451354980469, -0.26479339599609375, -0.2575416564941406, -0.2502899169921875, -0.24303817749023438, -0.23578643798828125, -0.22853469848632812, -0.221282958984375, -0.21403121948242188, -0.20677947998046875, -0.19952774047851562, -0.1922760009765625, -0.18502426147460938, -0.17777252197265625, -0.17052078247070312, -0.16326904296875, -0.15601730346679688, -0.14876556396484375, -0.14151382446289062, -0.1342620849609375, -0.12701034545898438, -0.11975860595703125, -0.11250686645507812, -0.105255126953125, -0.09800338745117188, -0.09075164794921875, -0.08349990844726562, -0.0762481689453125, -0.06899642944335938, -0.06174468994140625, -0.054492950439453125, -0.0472412109375, -0.039989471435546875, -0.03273773193359375, -0.025485992431640625, -0.0182342529296875, -0.010982513427734375, -0.00373077392578125, 0.003520965576171875, 0.010772705078125, 0.018024444580078125, 0.02527618408203125, 0.032527923583984375, 0.0397796630859375, 0.047031402587890625, 0.05428314208984375, 0.061534881591796875, 0.06878662109375, 0.07603836059570312, 0.08329010009765625, 0.09054183959960938, 0.0977935791015625, 0.10504531860351562, 0.11229705810546875, 0.11954879760742188, 0.126800537109375, 0.13405227661132812, 0.14130401611328125, 0.14855575561523438, 0.1558074951171875, 0.16305923461914062, 0.17031097412109375, 0.17756271362304688, 0.184814453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 4.0, 10.0, 13.0, 11.0, 14.0, 24.0, 23.0, 33.0, 37.0, 40.0, 47.0, 51.0, 42.0, 63.0, 64.0, 65.0, 62.0, 65.0, 60.0, 48.0, 37.0, 41.0, 27.0, 21.0, 26.0, 15.0, 16.0, 12.0, 7.0, 7.0, 9.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.242431640625, -0.23490333557128906, -0.22737503051757812, -0.2198467254638672, -0.21231842041015625, -0.2047901153564453, -0.19726181030273438, -0.18973350524902344, -0.1822052001953125, -0.17467689514160156, -0.16714859008789062, -0.1596202850341797, -0.15209197998046875, -0.1445636749267578, -0.13703536987304688, -0.12950706481933594, -0.121978759765625, -0.11445045471191406, -0.10692214965820312, -0.09939384460449219, -0.09186553955078125, -0.08433723449707031, -0.07680892944335938, -0.06928062438964844, -0.0617523193359375, -0.05422401428222656, -0.046695709228515625, -0.03916740417480469, -0.03163909912109375, -0.024110794067382812, -0.016582489013671875, -0.009054183959960938, -0.00152587890625, 0.0060024261474609375, 0.013530731201171875, 0.021059036254882812, 0.02858734130859375, 0.03611564636230469, 0.043643951416015625, 0.05117225646972656, 0.0587005615234375, 0.06622886657714844, 0.07375717163085938, 0.08128547668457031, 0.08881378173828125, 0.09634208679199219, 0.10387039184570312, 0.11139869689941406, 0.118927001953125, 0.12645530700683594, 0.13398361206054688, 0.1415119171142578, 0.14904022216796875, 0.1565685272216797, 0.16409683227539062, 0.17162513732910156, 0.1791534423828125, 0.18668174743652344, 0.19421005249023438, 0.2017383575439453, 0.20926666259765625, 0.2167949676513672, 0.22432327270507812, 0.23185157775878906, 0.2393798828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 7.0, 23.0, 23.0, 24.0, 41.0, 49.0, 54.0, 86.0, 104.0, 155.0, 197.0, 263.0, 362.0, 539.0, 977.0, 2155.0, 7831.0, 110065.0, 869469.0, 46473.0, 5273.0, 1727.0, 804.0, 491.0, 362.0, 232.0, 199.0, 128.0, 106.0, 82.0, 48.0, 40.0, 46.0, 19.0, 23.0, 14.0, 5.0, 8.0, 5.0, 8.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.61962890625, -0.5992279052734375, -0.578826904296875, -0.5584259033203125, -0.53802490234375, -0.5176239013671875, -0.497222900390625, -0.4768218994140625, -0.4564208984375, -0.4360198974609375, -0.415618896484375, -0.3952178955078125, -0.37481689453125, -0.3544158935546875, -0.334014892578125, -0.3136138916015625, -0.293212890625, -0.2728118896484375, -0.252410888671875, -0.2320098876953125, -0.21160888671875, -0.1912078857421875, -0.170806884765625, -0.1504058837890625, -0.1300048828125, -0.1096038818359375, -0.089202880859375, -0.0688018798828125, -0.04840087890625, -0.0279998779296875, -0.007598876953125, 0.0128021240234375, 0.033203125, 0.0536041259765625, 0.074005126953125, 0.0944061279296875, 0.11480712890625, 0.1352081298828125, 0.155609130859375, 0.1760101318359375, 0.1964111328125, 0.2168121337890625, 0.237213134765625, 0.2576141357421875, 0.27801513671875, 0.2984161376953125, 0.318817138671875, 0.3392181396484375, 0.359619140625, 0.3800201416015625, 0.400421142578125, 0.4208221435546875, 0.44122314453125, 0.4616241455078125, 0.482025146484375, 0.5024261474609375, 0.5228271484375, 0.5432281494140625, 0.563629150390625, 0.5840301513671875, 0.60443115234375, 0.6248321533203125, 0.645233154296875, 0.6656341552734375, 0.68603515625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 5.0, 11.0, 16.0, 20.0, 29.0, 27.0, 35.0, 42.0, 48.0, 47.0, 56.0, 51.0, 66.0, 58.0, 58.0, 53.0, 62.0, 47.0, 39.0, 36.0, 27.0, 32.0, 31.0, 15.0, 21.0, 13.0, 10.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.912109375, -0.8802490234375, -0.848388671875, -0.8165283203125, -0.78466796875, -0.7528076171875, -0.720947265625, -0.6890869140625, -0.6572265625, -0.6253662109375, -0.593505859375, -0.5616455078125, -0.52978515625, -0.4979248046875, -0.466064453125, -0.4342041015625, -0.40234375, -0.3704833984375, -0.338623046875, -0.3067626953125, -0.27490234375, -0.2430419921875, -0.211181640625, -0.1793212890625, -0.1474609375, -0.1156005859375, -0.083740234375, -0.0518798828125, -0.02001953125, 0.0118408203125, 0.043701171875, 0.0755615234375, 0.107421875, 0.1392822265625, 0.171142578125, 0.2030029296875, 0.23486328125, 0.2667236328125, 0.298583984375, 0.3304443359375, 0.3623046875, 0.3941650390625, 0.426025390625, 0.4578857421875, 0.48974609375, 0.5216064453125, 0.553466796875, 0.5853271484375, 0.6171875, 0.6490478515625, 0.680908203125, 0.7127685546875, 0.74462890625, 0.7764892578125, 0.808349609375, 0.8402099609375, 0.8720703125, 0.9039306640625, 0.935791015625, 0.9676513671875, 0.99951171875, 1.0313720703125, 1.063232421875, 1.0950927734375, 1.126953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 12.0, 9.0, 20.0, 29.0, 31.0, 50.0, 68.0, 128.0, 208.0, 384.0, 794.0, 2284.0, 9180.0, 87153.0, 851462.0, 83802.0, 8998.0, 2164.0, 813.0, 352.0, 214.0, 106.0, 71.0, 59.0, 49.0, 29.0, 20.0, 8.0, 12.0, 3.0, 9.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1767578125, -0.17131805419921875, -0.1658782958984375, -0.16043853759765625, -0.154998779296875, -0.14955902099609375, -0.1441192626953125, -0.13867950439453125, -0.13323974609375, -0.12779998779296875, -0.1223602294921875, -0.11692047119140625, -0.111480712890625, -0.10604095458984375, -0.1006011962890625, -0.09516143798828125, -0.0897216796875, -0.08428192138671875, -0.0788421630859375, -0.07340240478515625, -0.067962646484375, -0.06252288818359375, -0.0570831298828125, -0.05164337158203125, -0.04620361328125, -0.04076385498046875, -0.0353240966796875, -0.02988433837890625, -0.024444580078125, -0.01900482177734375, -0.0135650634765625, -0.00812530517578125, -0.002685546875, 0.00275421142578125, 0.0081939697265625, 0.01363372802734375, 0.019073486328125, 0.02451324462890625, 0.0299530029296875, 0.03539276123046875, 0.04083251953125, 0.04627227783203125, 0.0517120361328125, 0.05715179443359375, 0.062591552734375, 0.06803131103515625, 0.0734710693359375, 0.07891082763671875, 0.0843505859375, 0.08979034423828125, 0.0952301025390625, 0.10066986083984375, 0.106109619140625, 0.11154937744140625, 0.1169891357421875, 0.12242889404296875, 0.12786865234375, 0.13330841064453125, 0.1387481689453125, 0.14418792724609375, 0.149627685546875, 0.15506744384765625, 0.1605072021484375, 0.16594696044921875, 0.17138671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 11.0, 17.0, 8.0, 14.0, 22.0, 22.0, 19.0, 28.0, 39.0, 37.0, 80.0, 104.0, 114.0, 105.0, 82.0, 76.0, 37.0, 28.0, 30.0, 23.0, 16.0, 15.0, 13.0, 13.0, 2.0, 5.0, 7.0, 3.0, 3.0, 0.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.455183029174805e-05, -6.225146353244781e-05, -5.995109677314758e-05, -5.765073001384735e-05, -5.535036325454712e-05, -5.304999649524689e-05, -5.0749629735946655e-05, -4.844926297664642e-05, -4.614889621734619e-05, -4.384852945804596e-05, -4.154816269874573e-05, -3.9247795939445496e-05, -3.6947429180145264e-05, -3.464706242084503e-05, -3.23466956615448e-05, -3.0046328902244568e-05, -2.7745962142944336e-05, -2.5445595383644104e-05, -2.3145228624343872e-05, -2.084486186504364e-05, -1.8544495105743408e-05, -1.6244128346443176e-05, -1.3943761587142944e-05, -1.1643394827842712e-05, -9.34302806854248e-06, -7.0426613092422485e-06, -4.742294549942017e-06, -2.4419277906417847e-06, -1.4156103134155273e-07, 2.158805727958679e-06, 4.459172487258911e-06, 6.759539246559143e-06, 9.059906005859375e-06, 1.1360272765159607e-05, 1.3660639524459839e-05, 1.596100628376007e-05, 1.8261373043060303e-05, 2.0561739802360535e-05, 2.2862106561660767e-05, 2.5162473320961e-05, 2.746284008026123e-05, 2.9763206839561462e-05, 3.2063573598861694e-05, 3.4363940358161926e-05, 3.666430711746216e-05, 3.896467387676239e-05, 4.126504063606262e-05, 4.3565407395362854e-05, 4.5865774154663086e-05, 4.816614091396332e-05, 5.046650767326355e-05, 5.276687443256378e-05, 5.5067241191864014e-05, 5.7367607951164246e-05, 5.966797471046448e-05, 6.196834146976471e-05, 6.426870822906494e-05, 6.656907498836517e-05, 6.88694417476654e-05, 7.116980850696564e-05, 7.347017526626587e-05, 7.57705420255661e-05, 7.807090878486633e-05, 8.037127554416656e-05, 8.26716423034668e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 10.0, 1.0, 8.0, 9.0, 14.0, 18.0, 28.0, 32.0, 50.0, 67.0, 103.0, 141.0, 236.0, 409.0, 960.0, 2467.0, 9103.0, 70661.0, 861162.0, 87714.0, 10497.0, 2699.0, 996.0, 439.0, 255.0, 134.0, 112.0, 70.0, 42.0, 33.0, 20.0, 12.0, 12.0, 7.0, 7.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18658828735351562, -0.18067169189453125, -0.17475509643554688, -0.1688385009765625, -0.16292190551757812, -0.15700531005859375, -0.15108871459960938, -0.145172119140625, -0.13925552368164062, -0.13333892822265625, -0.12742233276367188, -0.1215057373046875, -0.11558914184570312, -0.10967254638671875, -0.10375595092773438, -0.09783935546875, -0.09192276000976562, -0.08600616455078125, -0.08008956909179688, -0.0741729736328125, -0.06825637817382812, -0.06233978271484375, -0.056423187255859375, -0.050506591796875, -0.044589996337890625, -0.03867340087890625, -0.032756805419921875, -0.0268402099609375, -0.020923614501953125, -0.01500701904296875, -0.009090423583984375, -0.003173828125, 0.002742767333984375, 0.00865936279296875, 0.014575958251953125, 0.0204925537109375, 0.026409149169921875, 0.03232574462890625, 0.038242340087890625, 0.044158935546875, 0.050075531005859375, 0.05599212646484375, 0.061908721923828125, 0.0678253173828125, 0.07374191284179688, 0.07965850830078125, 0.08557510375976562, 0.09149169921875, 0.09740829467773438, 0.10332489013671875, 0.10924148559570312, 0.1151580810546875, 0.12107467651367188, 0.12699127197265625, 0.13290786743164062, 0.138824462890625, 0.14474105834960938, 0.15065765380859375, 0.15657424926757812, 0.1624908447265625, 0.16840744018554688, 0.17432403564453125, 0.18024063110351562, 0.1861572265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 3.0, 8.0, 12.0, 8.0, 15.0, 19.0, 22.0, 32.0, 42.0, 55.0, 83.0, 73.0, 75.0, 101.0, 96.0, 64.0, 62.0, 43.0, 39.0, 32.0, 23.0, 26.0, 12.0, 13.0, 8.0, 2.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1324462890625, -0.12774085998535156, -0.12303543090820312, -0.11833000183105469, -0.11362457275390625, -0.10891914367675781, -0.10421371459960938, -0.09950828552246094, -0.0948028564453125, -0.09009742736816406, -0.08539199829101562, -0.08068656921386719, -0.07598114013671875, -0.07127571105957031, -0.06657028198242188, -0.06186485290527344, -0.057159423828125, -0.05245399475097656, -0.047748565673828125, -0.04304313659667969, -0.03833770751953125, -0.03363227844238281, -0.028926849365234375, -0.024221420288085938, -0.0195159912109375, -0.014810562133789062, -0.010105133056640625, -0.0053997039794921875, -0.00069427490234375, 0.0040111541748046875, 0.008716583251953125, 0.013422012329101562, 0.01812744140625, 0.022832870483398438, 0.027538299560546875, 0.03224372863769531, 0.03694915771484375, 0.04165458679199219, 0.046360015869140625, 0.05106544494628906, 0.0557708740234375, 0.06047630310058594, 0.06518173217773438, 0.06988716125488281, 0.07459259033203125, 0.07929801940917969, 0.08400344848632812, 0.08870887756347656, 0.093414306640625, 0.09811973571777344, 0.10282516479492188, 0.10753059387207031, 0.11223602294921875, 0.11694145202636719, 0.12164688110351562, 0.12635231018066406, 0.1310577392578125, 0.13576316833496094, 0.14046859741210938, 0.1451740264892578, 0.14987945556640625, 0.1545848846435547, 0.15929031372070312, 0.16399574279785156, 0.168701171875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 13.0, 28.0, 146.0, 511.0, 201.0, 45.0, 21.0, 14.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8624258041381836, -2.634716510772705, -2.4070072174072266, -2.179297924041748, -1.9515886306762695, -1.723879337310791, -1.4961700439453125, -1.268460750579834, -1.0407514572143555, -0.813042163848877, -0.5853328704833984, -0.3576235771179199, -0.1299142837524414, 0.09779500961303711, 0.3255043029785156, 0.5532135963439941, 0.7809228897094727, 1.0086321830749512, 1.2363414764404297, 1.4640507698059082, 1.6917600631713867, 1.9194693565368652, 2.1471786499023438, 2.3748879432678223, 2.602597236633301, 2.8303065299987793, 3.058015823364258, 3.2857251167297363, 3.513434410095215, 3.7411437034606934, 3.968852996826172, 4.19656229019165, 4.424271583557129, 4.651980876922607, 4.879690170288086, 5.1073994636535645, 5.335108757019043, 5.5628180503845215, 5.79052734375, 6.0182366371154785, 6.245945930480957, 6.4736552238464355, 6.701364517211914, 6.929073810577393, 7.156783103942871, 7.38449239730835, 7.612201690673828, 7.839910984039307, 8.067620277404785, 8.295330047607422, 8.523038864135742, 8.750747680664062, 8.9784574508667, 9.206167221069336, 9.433876037597656, 9.661584854125977, 9.889294624328613, 10.11700439453125, 10.34471321105957, 10.57242202758789, 10.800131797790527, 11.027841567993164, 11.255550384521484, 11.483259201049805, 11.710968971252441]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 3.0, 8.0, 11.0, 10.0, 12.0, 25.0, 16.0, 28.0, 25.0, 33.0, 36.0, 39.0, 44.0, 37.0, 53.0, 82.0, 82.0, 70.0, 60.0, 51.0, 45.0, 40.0, 29.0, 24.0, 16.0, 11.0, 20.0, 21.0, 20.0, 12.0, 7.0, 8.0, 7.0, 4.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.527020454406738, -4.412191390991211, -4.297362327575684, -4.182532787322998, -4.067703723907471, -3.9528746604919434, -3.838045597076416, -3.7232162952423096, -3.6083872318267822, -3.493558168411255, -3.3787288665771484, -3.263899803161621, -3.1490705013275146, -3.0342414379119873, -2.919412136077881, -2.8045830726623535, -2.689754009246826, -2.574924945831299, -2.4600956439971924, -2.345266580581665, -2.2304372787475586, -2.1156082153320312, -2.000779151916504, -1.8859498500823975, -1.771120548248291, -1.6562913656234741, -1.5414621829986572, -1.4266331195831299, -1.311803936958313, -1.196974754333496, -1.0821455717086792, -0.9673164486885071, -0.852487325668335, -0.7376581430435181, -0.622829020023346, -0.507999837398529, -0.39317068457603455, -0.27834153175354004, -0.16351234912872314, -0.048683226108551025, 0.06614595651626587, 0.18097510933876038, 0.2958042621612549, 0.4106334447860718, 0.5254626274108887, 0.6402917504310608, 0.7551209330558777, 0.8699500560760498, 0.9847792387008667, 1.0996084213256836, 1.2144376039505005, 1.3292667865753174, 1.4440958499908447, 1.5589250326156616, 1.6737542152404785, 1.7885832786560059, 1.9034125804901123, 2.0182416439056396, 2.133070945739746, 2.2479000091552734, 2.36272931098938, 2.4775583744049072, 2.5923876762390137, 2.707216739654541, 2.8220458030700684]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 7.0, 13.0, 14.0, 24.0, 39.0, 42.0, 80.0, 101.0, 176.0, 338.0, 637.0, 1406.0, 3165.0, 8699.0, 30127.0, 190516.0, 1707763.0, 1949170.0, 246779.0, 37120.0, 10003.0, 4015.0, 1908.0, 1012.0, 507.0, 262.0, 121.0, 71.0, 48.0, 35.0, 19.0, 19.0, 7.0, 6.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2349853515625, -0.22864341735839844, -0.22230148315429688, -0.2159595489501953, -0.20961761474609375, -0.2032756805419922, -0.19693374633789062, -0.19059181213378906, -0.1842498779296875, -0.17790794372558594, -0.17156600952148438, -0.1652240753173828, -0.15888214111328125, -0.1525402069091797, -0.14619827270507812, -0.13985633850097656, -0.133514404296875, -0.12717247009277344, -0.12083053588867188, -0.11448860168457031, -0.10814666748046875, -0.10180473327636719, -0.09546279907226562, -0.08912086486816406, -0.0827789306640625, -0.07643699645996094, -0.07009506225585938, -0.06375312805175781, -0.05741119384765625, -0.05106925964355469, -0.044727325439453125, -0.03838539123535156, -0.03204345703125, -0.025701522827148438, -0.019359588623046875, -0.013017654418945312, -0.00667572021484375, -0.0003337860107421875, 0.006008148193359375, 0.012350082397460938, 0.0186920166015625, 0.025033950805664062, 0.031375885009765625, 0.03771781921386719, 0.04405975341796875, 0.05040168762207031, 0.056743621826171875, 0.06308555603027344, 0.069427490234375, 0.07576942443847656, 0.08211135864257812, 0.08845329284667969, 0.09479522705078125, 0.10113716125488281, 0.10747909545898438, 0.11382102966308594, 0.1201629638671875, 0.12650489807128906, 0.13284683227539062, 0.1391887664794922, 0.14553070068359375, 0.1518726348876953, 0.15821456909179688, 0.16455650329589844, 0.1708984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 6.0, 8.0, 14.0, 24.0, 38.0, 54.0, 70.0, 79.0, 95.0, 95.0, 121.0, 73.0, 102.0, 83.0, 49.0, 30.0, 30.0, 18.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5141181945800781, -0.5018692016601562, -0.4896202087402344, -0.4773712158203125, -0.4651222229003906, -0.45287322998046875, -0.4406242370605469, -0.428375244140625, -0.4161262512207031, -0.40387725830078125, -0.3916282653808594, -0.3793792724609375, -0.3671302795410156, -0.35488128662109375, -0.3426322937011719, -0.33038330078125, -0.3181343078613281, -0.30588531494140625, -0.2936363220214844, -0.2813873291015625, -0.2691383361816406, -0.25688934326171875, -0.24464035034179688, -0.232391357421875, -0.22014236450195312, -0.20789337158203125, -0.19564437866210938, -0.1833953857421875, -0.17114639282226562, -0.15889739990234375, -0.14664840698242188, -0.1343994140625, -0.12215042114257812, -0.10990142822265625, -0.09765243530273438, -0.0854034423828125, -0.07315444946289062, -0.06090545654296875, -0.048656463623046875, -0.036407470703125, -0.024158477783203125, -0.01190948486328125, 0.000339508056640625, 0.0125885009765625, 0.024837493896484375, 0.03708648681640625, 0.049335479736328125, 0.06158447265625, 0.07383346557617188, 0.08608245849609375, 0.09833145141601562, 0.1105804443359375, 0.12282943725585938, 0.13507843017578125, 0.14732742309570312, 0.159576416015625, 0.17182540893554688, 0.18407440185546875, 0.19632339477539062, 0.2085723876953125, 0.22082138061523438, 0.23307037353515625, 0.24531936645507812, 0.257568359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 10.0, 20.0, 39.0, 74.0, 138.0, 257.0, 527.0, 954.0, 2175.0, 6902.0, 34552.0, 780462.0, 3288545.0, 67196.0, 8610.0, 2145.0, 753.0, 397.0, 209.0, 110.0, 68.0, 44.0, 24.0, 12.0, 15.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.3714790344238281, -0.35916900634765625, -0.3468589782714844, -0.3345489501953125, -0.3222389221191406, -0.30992889404296875, -0.2976188659667969, -0.285308837890625, -0.2729988098144531, -0.26068878173828125, -0.24837875366210938, -0.2360687255859375, -0.22375869750976562, -0.21144866943359375, -0.19913864135742188, -0.18682861328125, -0.17451858520507812, -0.16220855712890625, -0.14989852905273438, -0.1375885009765625, -0.12527847290039062, -0.11296844482421875, -0.10065841674804688, -0.088348388671875, -0.07603836059570312, -0.06372833251953125, -0.051418304443359375, -0.0391082763671875, -0.026798248291015625, -0.01448822021484375, -0.002178192138671875, 0.0101318359375, 0.022441864013671875, 0.03475189208984375, 0.047061920166015625, 0.0593719482421875, 0.07168197631835938, 0.08399200439453125, 0.09630203247070312, 0.108612060546875, 0.12092208862304688, 0.13323211669921875, 0.14554214477539062, 0.1578521728515625, 0.17016220092773438, 0.18247222900390625, 0.19478225708007812, 0.20709228515625, 0.21940231323242188, 0.23171234130859375, 0.24402236938476562, 0.2563323974609375, 0.2686424255371094, 0.28095245361328125, 0.2932624816894531, 0.305572509765625, 0.3178825378417969, 0.33019256591796875, 0.3425025939941406, 0.3548126220703125, 0.3671226501464844, 0.37943267822265625, 0.3917427062988281, 0.404052734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 10.0, 19.0, 29.0, 45.0, 76.0, 170.0, 545.0, 1361.0, 1203.0, 376.0, 113.0, 50.0, 26.0, 10.0, 16.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5540847778320312, -0.5334625244140625, -0.5128402709960938, -0.492218017578125, -0.47159576416015625, -0.4509735107421875, -0.43035125732421875, -0.40972900390625, -0.38910675048828125, -0.3684844970703125, -0.34786224365234375, -0.327239990234375, -0.30661773681640625, -0.2859954833984375, -0.26537322998046875, -0.2447509765625, -0.22412872314453125, -0.2035064697265625, -0.18288421630859375, -0.162261962890625, -0.14163970947265625, -0.1210174560546875, -0.10039520263671875, -0.07977294921875, -0.05915069580078125, -0.0385284423828125, -0.01790618896484375, 0.002716064453125, 0.02333831787109375, 0.0439605712890625, 0.06458282470703125, 0.085205078125, 0.10582733154296875, 0.1264495849609375, 0.14707183837890625, 0.167694091796875, 0.18831634521484375, 0.2089385986328125, 0.22956085205078125, 0.25018310546875, 0.27080535888671875, 0.2914276123046875, 0.31204986572265625, 0.332672119140625, 0.35329437255859375, 0.3739166259765625, 0.39453887939453125, 0.4151611328125, 0.43578338623046875, 0.4564056396484375, 0.47702789306640625, 0.497650146484375, 0.5182723999023438, 0.5388946533203125, 0.5595169067382812, 0.58013916015625, 0.6007614135742188, 0.6213836669921875, 0.6420059204101562, 0.662628173828125, 0.6832504272460938, 0.7038726806640625, 0.7244949340820312, 0.7451171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 33.0, 119.0, 372.0, 340.0, 89.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.320489883422852, -6.140018939971924, -5.959547996520996, -5.779077053070068, -5.598606109619141, -5.418135166168213, -5.237664222717285, -5.057193279266357, -4.87672233581543, -4.696251392364502, -4.515780448913574, -4.3353095054626465, -4.154838562011719, -3.974367618560791, -3.7938966751098633, -3.6134257316589355, -3.4329545497894287, -3.252483606338501, -3.0720126628875732, -2.8915417194366455, -2.7110707759857178, -2.53059983253479, -2.350128650665283, -2.1696577072143555, -1.9891868829727173, -1.8087159395217896, -1.6282449960708618, -1.4477739334106445, -1.2673029899597168, -1.086832046508789, -0.9063611030578613, -0.7258901596069336, -0.5454192161560059, -0.3649482727050781, -0.184477299451828, -0.004006326198577881, 0.17646461725234985, 0.3569355607032776, 0.5374065637588501, 0.7178775072097778, 0.8983484506607056, 1.0788193941116333, 1.259290337562561, 1.4397614002227783, 1.620232343673706, 1.8007032871246338, 1.9811742305755615, 2.1616451740264893, 2.342116117477417, 2.5225870609283447, 2.7030580043792725, 2.8835289478302, 3.063999891281128, 3.2444708347320557, 3.4249420166015625, 3.6054129600524902, 3.785883903503418, 3.9663548469543457, 4.146825790405273, 4.327296733856201, 4.507767677307129, 4.688238620758057, 4.868709564208984, 5.049180507659912, 5.22965145111084]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 8.0, 15.0, 9.0, 22.0, 20.0, 29.0, 36.0, 54.0, 62.0, 76.0, 82.0, 84.0, 80.0, 76.0, 77.0, 61.0, 54.0, 35.0, 30.0, 23.0, 19.0, 13.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.850261926651001, -1.7613246440887451, -1.6723873615264893, -1.5834500789642334, -1.4945127964019775, -1.4055755138397217, -1.3166381120681763, -1.2277008295059204, -1.1387635469436646, -1.0498262643814087, -0.9608889818191528, -0.8719516396522522, -0.7830143570899963, -0.6940770745277405, -0.6051397323608398, -0.516202449798584, -0.4272651672363281, -0.33832788467407227, -0.24939057230949402, -0.16045325994491577, -0.07151597738265991, 0.017421305179595947, 0.10635864734649658, 0.19529592990875244, 0.2842332124710083, 0.37317049503326416, 0.4621078073978424, 0.5510451197624207, 0.6399824023246765, 0.7289196848869324, 0.817857027053833, 0.9067943096160889, 0.9957313537597656, 1.0846686363220215, 1.1736059188842773, 1.2625432014465332, 1.351480484008789, 1.440417766571045, 1.5293551683425903, 1.6182924509048462, 1.707229733467102, 1.796167016029358, 1.8851042985916138, 1.9740417003631592, 2.062978982925415, 2.151916265487671, 2.2408535480499268, 2.3297908306121826, 2.4187281131744385, 2.5076653957366943, 2.59660267829895, 2.685539960861206, 2.774477243423462, 2.8634145259857178, 2.9523520469665527, 3.0412893295288086, 3.1302266120910645, 3.2191638946533203, 3.308101177215576, 3.397038459777832, 3.485975742340088, 3.5749130249023438, 3.6638503074645996, 3.7527875900268555, 3.8417248725891113]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 6.0, 2.0, 7.0, 7.0, 13.0, 10.0, 31.0, 27.0, 38.0, 67.0, 105.0, 166.0, 291.0, 501.0, 913.0, 1961.0, 4644.0, 12719.0, 39375.0, 139561.0, 403020.0, 310379.0, 92276.0, 26749.0, 8908.0, 3401.0, 1545.0, 740.0, 413.0, 243.0, 130.0, 89.0, 55.0, 40.0, 32.0, 20.0, 20.0, 13.0, 11.0, 11.0, 2.0, 2.0, 5.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.236328125, -0.22866439819335938, -0.22100067138671875, -0.21333694458007812, -0.2056732177734375, -0.19800949096679688, -0.19034576416015625, -0.18268203735351562, -0.175018310546875, -0.16735458374023438, -0.15969085693359375, -0.15202713012695312, -0.1443634033203125, -0.13669967651367188, -0.12903594970703125, -0.12137222290039062, -0.11370849609375, -0.10604476928710938, -0.09838104248046875, -0.09071731567382812, -0.0830535888671875, -0.07538986206054688, -0.06772613525390625, -0.060062408447265625, -0.052398681640625, -0.044734954833984375, -0.03707122802734375, -0.029407501220703125, -0.0217437744140625, -0.014080047607421875, -0.00641632080078125, 0.001247406005859375, 0.0089111328125, 0.016574859619140625, 0.02423858642578125, 0.031902313232421875, 0.0395660400390625, 0.047229766845703125, 0.05489349365234375, 0.06255722045898438, 0.070220947265625, 0.07788467407226562, 0.08554840087890625, 0.09321212768554688, 0.1008758544921875, 0.10853958129882812, 0.11620330810546875, 0.12386703491210938, 0.13153076171875, 0.13919448852539062, 0.14685821533203125, 0.15452194213867188, 0.1621856689453125, 0.16984939575195312, 0.17751312255859375, 0.18517684936523438, 0.192840576171875, 0.20050430297851562, 0.20816802978515625, 0.21583175659179688, 0.2234954833984375, 0.23115921020507812, 0.23882293701171875, 0.24648666381835938, 0.254150390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 5.0, 6.0, 3.0, 14.0, 10.0, 22.0, 23.0, 35.0, 44.0, 40.0, 50.0, 62.0, 78.0, 64.0, 63.0, 74.0, 62.0, 73.0, 54.0, 34.0, 53.0, 33.0, 28.0, 17.0, 17.0, 11.0, 8.0, 6.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2406005859375, -0.2329540252685547, -0.22530746459960938, -0.21766090393066406, -0.21001434326171875, -0.20236778259277344, -0.19472122192382812, -0.1870746612548828, -0.1794281005859375, -0.1717815399169922, -0.16413497924804688, -0.15648841857910156, -0.14884185791015625, -0.14119529724121094, -0.13354873657226562, -0.1259021759033203, -0.118255615234375, -0.11060905456542969, -0.10296249389648438, -0.09531593322753906, -0.08766937255859375, -0.08002281188964844, -0.07237625122070312, -0.06472969055175781, -0.0570831298828125, -0.04943656921386719, -0.041790008544921875, -0.03414344787597656, -0.02649688720703125, -0.018850326538085938, -0.011203765869140625, -0.0035572052001953125, 0.00408935546875, 0.011735916137695312, 0.019382476806640625, 0.027029037475585938, 0.03467559814453125, 0.04232215881347656, 0.049968719482421875, 0.05761528015136719, 0.0652618408203125, 0.07290840148925781, 0.08055496215820312, 0.08820152282714844, 0.09584808349609375, 0.10349464416503906, 0.11114120483398438, 0.11878776550292969, 0.126434326171875, 0.1340808868408203, 0.14172744750976562, 0.14937400817871094, 0.15702056884765625, 0.16466712951660156, 0.17231369018554688, 0.1799602508544922, 0.1876068115234375, 0.1952533721923828, 0.20289993286132812, 0.21054649353027344, 0.21819305419921875, 0.22583961486816406, 0.23348617553710938, 0.2411327362060547, 0.248779296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 9.0, 8.0, 13.0, 24.0, 22.0, 42.0, 55.0, 81.0, 117.0, 187.0, 279.0, 404.0, 693.0, 1377.0, 3635.0, 28068.0, 827793.0, 172358.0, 8675.0, 2134.0, 1015.0, 521.0, 341.0, 220.0, 147.0, 119.0, 69.0, 44.0, 28.0, 17.0, 15.0, 14.0, 11.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7029647827148438, -0.6808319091796875, -0.6586990356445312, -0.636566162109375, -0.6144332885742188, -0.5923004150390625, -0.5701675415039062, -0.54803466796875, -0.5259017944335938, -0.5037689208984375, -0.48163604736328125, -0.459503173828125, -0.43737030029296875, -0.4152374267578125, -0.39310455322265625, -0.3709716796875, -0.34883880615234375, -0.3267059326171875, -0.30457305908203125, -0.282440185546875, -0.26030731201171875, -0.2381744384765625, -0.21604156494140625, -0.19390869140625, -0.17177581787109375, -0.1496429443359375, -0.12751007080078125, -0.105377197265625, -0.08324432373046875, -0.0611114501953125, -0.03897857666015625, -0.016845703125, 0.00528717041015625, 0.0274200439453125, 0.04955291748046875, 0.071685791015625, 0.09381866455078125, 0.1159515380859375, 0.13808441162109375, 0.16021728515625, 0.18235015869140625, 0.2044830322265625, 0.22661590576171875, 0.248748779296875, 0.27088165283203125, 0.2930145263671875, 0.31514739990234375, 0.3372802734375, 0.35941314697265625, 0.3815460205078125, 0.40367889404296875, 0.425811767578125, 0.44794464111328125, 0.4700775146484375, 0.49221038818359375, 0.51434326171875, 0.5364761352539062, 0.5586090087890625, 0.5807418823242188, 0.602874755859375, 0.6250076293945312, 0.6471405029296875, 0.6692733764648438, 0.69140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 5.0, 7.0, 12.0, 14.0, 18.0, 15.0, 19.0, 19.0, 30.0, 19.0, 45.0, 38.0, 36.0, 33.0, 48.0, 48.0, 50.0, 54.0, 44.0, 55.0, 47.0, 39.0, 42.0, 38.0, 34.0, 22.0, 28.0, 22.0, 18.0, 16.0, 10.0, 16.0, 9.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6630859375, -0.6439285278320312, -0.6247711181640625, -0.6056137084960938, -0.586456298828125, -0.5672988891601562, -0.5481414794921875, -0.5289840698242188, -0.50982666015625, -0.49066925048828125, -0.4715118408203125, -0.45235443115234375, -0.433197021484375, -0.41403961181640625, -0.3948822021484375, -0.37572479248046875, -0.3565673828125, -0.33740997314453125, -0.3182525634765625, -0.29909515380859375, -0.279937744140625, -0.26078033447265625, -0.2416229248046875, -0.22246551513671875, -0.20330810546875, -0.18415069580078125, -0.1649932861328125, -0.14583587646484375, -0.126678466796875, -0.10752105712890625, -0.0883636474609375, -0.06920623779296875, -0.050048828125, -0.03089141845703125, -0.0117340087890625, 0.00742340087890625, 0.026580810546875, 0.04573822021484375, 0.0648956298828125, 0.08405303955078125, 0.10321044921875, 0.12236785888671875, 0.1415252685546875, 0.16068267822265625, 0.179840087890625, 0.19899749755859375, 0.2181549072265625, 0.23731231689453125, 0.2564697265625, 0.27562713623046875, 0.2947845458984375, 0.31394195556640625, 0.333099365234375, 0.35225677490234375, 0.3714141845703125, 0.39057159423828125, 0.40972900390625, 0.42888641357421875, 0.4480438232421875, 0.46720123291015625, 0.486358642578125, 0.5055160522460938, 0.5246734619140625, 0.5438308715820312, 0.56298828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 12.0, 9.0, 7.0, 23.0, 18.0, 22.0, 40.0, 65.0, 83.0, 162.0, 330.0, 885.0, 3623.0, 40757.0, 917753.0, 77554.0, 5220.0, 1115.0, 392.0, 167.0, 91.0, 51.0, 34.0, 26.0, 24.0, 15.0, 15.0, 11.0, 4.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2113037109375, -0.2036457061767578, -0.19598770141601562, -0.18832969665527344, -0.18067169189453125, -0.17301368713378906, -0.16535568237304688, -0.1576976776123047, -0.1500396728515625, -0.1423816680908203, -0.13472366333007812, -0.12706565856933594, -0.11940765380859375, -0.11174964904785156, -0.10409164428710938, -0.09643363952636719, -0.088775634765625, -0.08111763000488281, -0.07345962524414062, -0.06580162048339844, -0.05814361572265625, -0.05048561096191406, -0.042827606201171875, -0.03516960144042969, -0.0275115966796875, -0.019853591918945312, -0.012195587158203125, -0.0045375823974609375, 0.00312042236328125, 0.010778427124023438, 0.018436431884765625, 0.026094436645507812, 0.03375244140625, 0.04141044616699219, 0.049068450927734375, 0.05672645568847656, 0.06438446044921875, 0.07204246520996094, 0.07970046997070312, 0.08735847473144531, 0.0950164794921875, 0.10267448425292969, 0.11033248901367188, 0.11799049377441406, 0.12564849853515625, 0.13330650329589844, 0.14096450805664062, 0.1486225128173828, 0.156280517578125, 0.1639385223388672, 0.17159652709960938, 0.17925453186035156, 0.18691253662109375, 0.19457054138183594, 0.20222854614257812, 0.2098865509033203, 0.2175445556640625, 0.2252025604248047, 0.23286056518554688, 0.24051856994628906, 0.24817657470703125, 0.25583457946777344, 0.2634925842285156, 0.2711505889892578, 0.27880859375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 14.0, 16.0, 27.0, 35.0, 58.0, 115.0, 182.0, 176.0, 126.0, 54.0, 40.0, 30.0, 23.0, 16.0, 16.0, 5.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011849403381347656, -0.0001147901639342308, -0.00011108629405498505, -0.00010738242417573929, -0.00010367855429649353, -9.997468441724777e-05, -9.627081453800201e-05, -9.256694465875626e-05, -8.88630747795105e-05, -8.515920490026474e-05, -8.145533502101898e-05, -7.775146514177322e-05, -7.404759526252747e-05, -7.034372538328171e-05, -6.663985550403595e-05, -6.293598562479019e-05, -5.9232115745544434e-05, -5.5528245866298676e-05, -5.182437598705292e-05, -4.812050610780716e-05, -4.44166362285614e-05, -4.071276634931564e-05, -3.7008896470069885e-05, -3.330502659082413e-05, -2.960115671157837e-05, -2.589728683233261e-05, -2.2193416953086853e-05, -1.8489547073841095e-05, -1.4785677194595337e-05, -1.1081807315349579e-05, -7.377937436103821e-06, -3.6740675568580627e-06, 2.9802322387695312e-08, 3.7336722016334534e-06, 7.4375420808792114e-06, 1.114141196012497e-05, 1.4845281839370728e-05, 1.8549151718616486e-05, 2.2253021597862244e-05, 2.5956891477108002e-05, 2.966076135635376e-05, 3.336463123559952e-05, 3.7068501114845276e-05, 4.0772370994091034e-05, 4.447624087333679e-05, 4.818011075258255e-05, 5.188398063182831e-05, 5.5587850511074066e-05, 5.9291720390319824e-05, 6.299559026956558e-05, 6.669946014881134e-05, 7.04033300280571e-05, 7.410719990730286e-05, 7.781106978654861e-05, 8.151493966579437e-05, 8.521880954504013e-05, 8.892267942428589e-05, 9.262654930353165e-05, 9.63304191827774e-05, 0.00010003428906202316, 0.00010373815894126892, 0.00010744202882051468, 0.00011114589869976044, 0.0001148497685790062, 0.00011855363845825195]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 1.0, 7.0, 9.0, 13.0, 15.0, 31.0, 54.0, 66.0, 132.0, 209.0, 461.0, 1181.0, 3986.0, 27238.0, 793351.0, 206421.0, 11372.0, 2376.0, 799.0, 380.0, 183.0, 95.0, 61.0, 41.0, 16.0, 16.0, 8.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16910743713378906, -0.16255569458007812, -0.1560039520263672, -0.14945220947265625, -0.1429004669189453, -0.13634872436523438, -0.12979698181152344, -0.1232452392578125, -0.11669349670410156, -0.11014175415039062, -0.10359001159667969, -0.09703826904296875, -0.09048652648925781, -0.08393478393554688, -0.07738304138183594, -0.070831298828125, -0.06427955627441406, -0.057727813720703125, -0.05117607116699219, -0.04462432861328125, -0.03807258605957031, -0.031520843505859375, -0.024969100952148438, -0.0184173583984375, -0.011865615844726562, -0.005313873291015625, 0.0012378692626953125, 0.00778961181640625, 0.014341354370117188, 0.020893096923828125, 0.027444839477539062, 0.03399658203125, 0.04054832458496094, 0.047100067138671875, 0.05365180969238281, 0.06020355224609375, 0.06675529479980469, 0.07330703735351562, 0.07985877990722656, 0.0864105224609375, 0.09296226501464844, 0.09951400756835938, 0.10606575012207031, 0.11261749267578125, 0.11916923522949219, 0.12572097778320312, 0.13227272033691406, 0.138824462890625, 0.14537620544433594, 0.15192794799804688, 0.1584796905517578, 0.16503143310546875, 0.1715831756591797, 0.17813491821289062, 0.18468666076660156, 0.1912384033203125, 0.19779014587402344, 0.20434188842773438, 0.2108936309814453, 0.21744537353515625, 0.2239971160888672, 0.23054885864257812, 0.23710060119628906, 0.24365234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 5.0, 3.0, 5.0, 14.0, 5.0, 22.0, 20.0, 38.0, 39.0, 64.0, 66.0, 73.0, 89.0, 90.0, 79.0, 67.0, 71.0, 42.0, 44.0, 28.0, 31.0, 10.0, 13.0, 5.0, 16.0, 8.0, 9.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0], "bins": [-0.1424560546875, -0.13886260986328125, -0.1352691650390625, -0.13167572021484375, -0.128082275390625, -0.12448883056640625, -0.1208953857421875, -0.11730194091796875, -0.11370849609375, -0.11011505126953125, -0.1065216064453125, -0.10292816162109375, -0.099334716796875, -0.09574127197265625, -0.0921478271484375, -0.08855438232421875, -0.0849609375, -0.08136749267578125, -0.0777740478515625, -0.07418060302734375, -0.070587158203125, -0.06699371337890625, -0.0634002685546875, -0.05980682373046875, -0.05621337890625, -0.05261993408203125, -0.0490264892578125, -0.04543304443359375, -0.041839599609375, -0.03824615478515625, -0.0346527099609375, -0.03105926513671875, -0.0274658203125, -0.02387237548828125, -0.0202789306640625, -0.01668548583984375, -0.013092041015625, -0.00949859619140625, -0.0059051513671875, -0.00231170654296875, 0.00128173828125, 0.00487518310546875, 0.0084686279296875, 0.01206207275390625, 0.015655517578125, 0.01924896240234375, 0.0228424072265625, 0.02643585205078125, 0.030029296875, 0.03362274169921875, 0.0372161865234375, 0.04080963134765625, 0.044403076171875, 0.04799652099609375, 0.0515899658203125, 0.05518341064453125, 0.05877685546875, 0.06237030029296875, 0.0659637451171875, 0.06955718994140625, 0.073150634765625, 0.07674407958984375, 0.0803375244140625, 0.08393096923828125, 0.0875244140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 18.0, 80.0, 295.0, 394.0, 114.0, 34.0, 22.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9648702144622803, -1.7874879837036133, -1.6101056337356567, -1.4327232837677002, -1.2553410530090332, -1.0779588222503662, -0.9005764722824097, -0.7231941223144531, -0.5458118915557861, -0.36842960119247437, -0.1910473108291626, -0.01366502046585083, 0.16371726989746094, 0.3410995602607727, 0.5184818506240845, 0.695864200592041, 0.873246431350708, 1.050628662109375, 1.2280110120773315, 1.405393362045288, 1.582775592803955, 1.760157823562622, 1.9375401735305786, 2.114922523498535, 2.292304754257202, 2.469686985015869, 2.6470694541931152, 2.8244516849517822, 3.001833915710449, 3.179216146469116, 3.356598377227783, 3.5339808464050293, 3.711362838745117, 3.888745069503784, 4.066127300262451, 4.243509769439697, 4.420891761779785, 4.598274230957031, 4.775656700134277, 4.953039169311523, 5.130421161651611, 5.307803630828857, 5.485185623168945, 5.662568092346191, 5.8399505615234375, 6.017332553863525, 6.1947150230407715, 6.372097015380859, 6.5494794845581055, 6.726861953735352, 6.9042439460754395, 7.0816264152526855, 7.259008407592773, 7.4363908767700195, 7.613773345947266, 7.791155815124512, 7.9685378074646, 8.145919799804688, 8.323302268981934, 8.50068473815918, 8.678067207336426, 8.855449676513672, 9.032831192016602, 9.210213661193848, 9.387596130371094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 5.0, 6.0, 2.0, 3.0, 5.0, 11.0, 12.0, 15.0, 15.0, 8.0, 21.0, 23.0, 14.0, 23.0, 21.0, 34.0, 21.0, 29.0, 29.0, 33.0, 52.0, 68.0, 58.0, 55.0, 60.0, 34.0, 53.0, 44.0, 24.0, 22.0, 28.0, 20.0, 25.0, 21.0, 17.0, 12.0, 13.0, 10.0, 9.0, 6.0, 9.0, 6.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.0536327362060547, -1.9866238832473755, -1.9196151494979858, -1.8526062965393066, -1.785597562789917, -1.7185887098312378, -1.6515798568725586, -1.584571123123169, -1.5175623893737793, -1.4505535364151, -1.3835448026657104, -1.3165359497070312, -1.2495272159576416, -1.1825183629989624, -1.1155095100402832, -1.0485007762908936, -0.9814919233322144, -0.9144831299781799, -0.8474743366241455, -0.7804654836654663, -0.7134567499160767, -0.6464478969573975, -0.579439103603363, -0.5124303102493286, -0.4454215168952942, -0.37841272354125977, -0.31140393018722534, -0.24439510703086853, -0.1773863136768341, -0.11037752032279968, -0.04336869716644287, 0.023640096187591553, 0.09064888954162598, 0.1576576828956604, 0.22466649115085602, 0.29167529940605164, 0.35868409276008606, 0.4256928861141205, 0.4927017092704773, 0.5597105026245117, 0.6267192959785461, 0.6937280893325806, 0.760736882686615, 0.8277456760406494, 0.8947545289993286, 0.9617632627487183, 1.0287721157073975, 1.095780849456787, 1.1627897024154663, 1.2297985553741455, 1.2968072891235352, 1.3638161420822144, 1.430824875831604, 1.4978337287902832, 1.5648424625396729, 1.631851315498352, 1.6988601684570312, 1.7658690214157104, 1.8328777551651, 1.8998866081237793, 1.966895341873169, 2.0339040756225586, 2.1009130477905273, 2.167921781539917, 2.2349305152893066]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 18.0, 29.0, 49.0, 83.0, 198.0, 473.0, 1685.0, 12565.0, 685095.0, 3442515.0, 47180.0, 3140.0, 677.0, 276.0, 145.0, 71.0, 34.0, 23.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6435546875, -0.6283111572265625, -0.613067626953125, -0.5978240966796875, -0.58258056640625, -0.5673370361328125, -0.552093505859375, -0.5368499755859375, -0.5216064453125, -0.5063629150390625, -0.491119384765625, -0.4758758544921875, -0.46063232421875, -0.4453887939453125, -0.430145263671875, -0.4149017333984375, -0.399658203125, -0.3844146728515625, -0.369171142578125, -0.3539276123046875, -0.33868408203125, -0.3234405517578125, -0.308197021484375, -0.2929534912109375, -0.2777099609375, -0.2624664306640625, -0.247222900390625, -0.2319793701171875, -0.21673583984375, -0.2014923095703125, -0.186248779296875, -0.1710052490234375, -0.15576171875, -0.1405181884765625, -0.125274658203125, -0.1100311279296875, -0.09478759765625, -0.0795440673828125, -0.064300537109375, -0.0490570068359375, -0.0338134765625, -0.0185699462890625, -0.003326416015625, 0.0119171142578125, 0.02716064453125, 0.0424041748046875, 0.057647705078125, 0.0728912353515625, 0.088134765625, 0.1033782958984375, 0.118621826171875, 0.1338653564453125, 0.14910888671875, 0.1643524169921875, 0.179595947265625, 0.1948394775390625, 0.2100830078125, 0.2253265380859375, 0.240570068359375, 0.2558135986328125, 0.27105712890625, 0.2863006591796875, 0.301544189453125, 0.3167877197265625, 0.33203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 13.0, 8.0, 13.0, 30.0, 39.0, 44.0, 43.0, 60.0, 61.0, 74.0, 75.0, 74.0, 58.0, 74.0, 65.0, 45.0, 49.0, 37.0, 38.0, 25.0, 22.0, 10.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23218345642089844, -0.22449874877929688, -0.2168140411376953, -0.20912933349609375, -0.2014446258544922, -0.19375991821289062, -0.18607521057128906, -0.1783905029296875, -0.17070579528808594, -0.16302108764648438, -0.1553363800048828, -0.14765167236328125, -0.1399669647216797, -0.13228225708007812, -0.12459754943847656, -0.116912841796875, -0.10922813415527344, -0.10154342651367188, -0.09385871887207031, -0.08617401123046875, -0.07848930358886719, -0.07080459594726562, -0.06311988830566406, -0.0554351806640625, -0.04775047302246094, -0.040065765380859375, -0.03238105773925781, -0.02469635009765625, -0.017011642456054688, -0.009326934814453125, -0.0016422271728515625, 0.00604248046875, 0.013727188110351562, 0.021411895751953125, 0.029096603393554688, 0.03678131103515625, 0.04446601867675781, 0.052150726318359375, 0.05983543395996094, 0.0675201416015625, 0.07520484924316406, 0.08288955688476562, 0.09057426452636719, 0.09825897216796875, 0.10594367980957031, 0.11362838745117188, 0.12131309509277344, 0.128997802734375, 0.13668251037597656, 0.14436721801757812, 0.1520519256591797, 0.15973663330078125, 0.1674213409423828, 0.17510604858398438, 0.18279075622558594, 0.1904754638671875, 0.19816017150878906, 0.20584487915039062, 0.2135295867919922, 0.22121429443359375, 0.2288990020751953, 0.23658370971679688, 0.24426841735839844, 0.251953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 15.0, 28.0, 38.0, 77.0, 187.0, 470.0, 1185.0, 3411.0, 23994.0, 4034642.0, 123343.0, 4695.0, 1259.0, 461.0, 238.0, 115.0, 53.0, 18.0, 21.0, 12.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6123046875, -0.5884628295898438, -0.5646209716796875, -0.5407791137695312, -0.516937255859375, -0.49309539794921875, -0.4692535400390625, -0.44541168212890625, -0.42156982421875, -0.39772796630859375, -0.3738861083984375, -0.35004425048828125, -0.326202392578125, -0.30236053466796875, -0.2785186767578125, -0.25467681884765625, -0.2308349609375, -0.20699310302734375, -0.1831512451171875, -0.15930938720703125, -0.135467529296875, -0.11162567138671875, -0.0877838134765625, -0.06394195556640625, -0.04010009765625, -0.01625823974609375, 0.0075836181640625, 0.03142547607421875, 0.055267333984375, 0.07910919189453125, 0.1029510498046875, 0.12679290771484375, 0.150634765625, 0.17447662353515625, 0.1983184814453125, 0.22216033935546875, 0.246002197265625, 0.26984405517578125, 0.2936859130859375, 0.31752777099609375, 0.34136962890625, 0.36521148681640625, 0.3890533447265625, 0.41289520263671875, 0.436737060546875, 0.46057891845703125, 0.4844207763671875, 0.5082626342773438, 0.5321044921875, 0.5559463500976562, 0.5797882080078125, 0.6036300659179688, 0.627471923828125, 0.6513137817382812, 0.6751556396484375, 0.6989974975585938, 0.72283935546875, 0.7466812133789062, 0.7705230712890625, 0.7943649291992188, 0.818206787109375, 0.8420486450195312, 0.8658905029296875, 0.8897323608398438, 0.91357421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 6.0, 31.0, 48.0, 98.0, 359.0, 1109.0, 1496.0, 604.0, 163.0, 70.0, 33.0, 13.0, 11.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7109375, -0.6901702880859375, -0.669403076171875, -0.6486358642578125, -0.62786865234375, -0.6071014404296875, -0.586334228515625, -0.5655670166015625, -0.5447998046875, -0.5240325927734375, -0.503265380859375, -0.4824981689453125, -0.46173095703125, -0.4409637451171875, -0.420196533203125, -0.3994293212890625, -0.378662109375, -0.3578948974609375, -0.337127685546875, -0.3163604736328125, -0.29559326171875, -0.2748260498046875, -0.254058837890625, -0.2332916259765625, -0.2125244140625, -0.1917572021484375, -0.170989990234375, -0.1502227783203125, -0.12945556640625, -0.1086883544921875, -0.087921142578125, -0.0671539306640625, -0.04638671875, -0.0256195068359375, -0.004852294921875, 0.0159149169921875, 0.03668212890625, 0.0574493408203125, 0.078216552734375, 0.0989837646484375, 0.1197509765625, 0.1405181884765625, 0.161285400390625, 0.1820526123046875, 0.20281982421875, 0.2235870361328125, 0.244354248046875, 0.2651214599609375, 0.285888671875, 0.3066558837890625, 0.327423095703125, 0.3481903076171875, 0.36895751953125, 0.3897247314453125, 0.410491943359375, 0.4312591552734375, 0.4520263671875, 0.4727935791015625, 0.493560791015625, 0.5143280029296875, 0.53509521484375, 0.5558624267578125, 0.576629638671875, 0.5973968505859375, 0.6181640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 9.0, 24.0, 122.0, 507.0, 268.0, 42.0, 6.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.73887825012207, -8.506672859191895, -8.274467468261719, -8.042261123657227, -7.810055732727051, -7.577850341796875, -7.345644950866699, -7.113439083099365, -6.881233215332031, -6.6490278244018555, -6.4168219566345215, -6.184616565704346, -5.952410697937012, -5.720205307006836, -5.48799991607666, -5.255794048309326, -5.02358865737915, -4.791383266448975, -4.559177398681641, -4.326972007751465, -4.094766139984131, -3.862560749053955, -3.6303551197052, -3.3981494903564453, -3.1659438610076904, -2.9337382316589355, -2.7015326023101807, -2.469326972961426, -2.23712158203125, -2.004915714263916, -1.7727103233337402, -1.5405046939849854, -1.3082990646362305, -1.0760934352874756, -0.8438878655433655, -0.6116822957992554, -0.3794766664505005, -0.1472710371017456, 0.08493447303771973, 0.3171401023864746, 0.5493457317352295, 0.7815513610839844, 1.0137569904327393, 1.2459625005722046, 1.4781681299209595, 1.7103737592697144, 1.9425792694091797, 2.1747848987579346, 2.4069905281066895, 2.6391961574554443, 2.871401786804199, 3.103607177734375, 3.335813045501709, 3.5680184364318848, 3.8002240657806396, 4.0324296951293945, 4.26463508605957, 4.496840476989746, 4.72904634475708, 4.961251735687256, 5.19345760345459, 5.425662994384766, 5.657868385314941, 5.890074253082275, 6.122280120849609]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 16.0, 30.0, 67.0, 79.0, 87.0, 136.0, 142.0, 124.0, 109.0, 88.0, 51.0, 31.0, 11.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.660445213317871, -3.5347414016723633, -3.4090375900268555, -3.2833337783813477, -3.1576297283172607, -3.031925916671753, -2.906222105026245, -2.7805182933807373, -2.6548142433166504, -2.5291104316711426, -2.4034066200256348, -2.277702808380127, -2.15199875831604, -2.0262949466705322, -1.9005911350250244, -1.7748873233795166, -1.6491835117340088, -1.523479700088501, -1.3977757692337036, -1.2720719575881958, -1.1463680267333984, -1.0206642150878906, -0.8949604034423828, -0.7692565321922302, -0.6435526609420776, -0.517848789691925, -0.39214494824409485, -0.26644110679626465, -0.14073723554611206, -0.015033364295959473, 0.11067044734954834, 0.23637431859970093, 0.3620781898498535, 0.4877820611000061, 0.6134859323501587, 0.7391897439956665, 0.8648936152458191, 0.9905974864959717, 1.1163012981414795, 1.2420051097869873, 1.3677090406417847, 1.4934128522872925, 1.6191167831420898, 1.7448205947875977, 1.8705244064331055, 1.9962283372879028, 2.121932029724121, 2.247636079788208, 2.373339891433716, 2.4990437030792236, 2.6247475147247314, 2.7504515647888184, 2.876155376434326, 3.001859188079834, 3.127562999725342, 3.2532668113708496, 3.3789706230163574, 3.5046744346618652, 3.630378246307373, 3.756082057952881, 3.8817861080169678, 4.007490158081055, 4.1331939697265625, 4.25889778137207, 4.384601593017578]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 1.0, 6.0, 10.0, 11.0, 20.0, 19.0, 32.0, 55.0, 83.0, 142.0, 297.0, 604.0, 1427.0, 4283.0, 19119.0, 140198.0, 654690.0, 194959.0, 24338.0, 5226.0, 1649.0, 636.0, 301.0, 160.0, 96.0, 42.0, 50.0, 17.0, 20.0, 13.0, 8.0, 10.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.43310546875, -0.4205780029296875, -0.408050537109375, -0.3955230712890625, -0.38299560546875, -0.3704681396484375, -0.357940673828125, -0.3454132080078125, -0.3328857421875, -0.3203582763671875, -0.307830810546875, -0.2953033447265625, -0.28277587890625, -0.2702484130859375, -0.257720947265625, -0.2451934814453125, -0.232666015625, -0.2201385498046875, -0.207611083984375, -0.1950836181640625, -0.18255615234375, -0.1700286865234375, -0.157501220703125, -0.1449737548828125, -0.1324462890625, -0.1199188232421875, -0.107391357421875, -0.0948638916015625, -0.08233642578125, -0.0698089599609375, -0.057281494140625, -0.0447540283203125, -0.0322265625, -0.0196990966796875, -0.007171630859375, 0.0053558349609375, 0.01788330078125, 0.0304107666015625, 0.042938232421875, 0.0554656982421875, 0.0679931640625, 0.0805206298828125, 0.093048095703125, 0.1055755615234375, 0.11810302734375, 0.1306304931640625, 0.143157958984375, 0.1556854248046875, 0.168212890625, 0.1807403564453125, 0.193267822265625, 0.2057952880859375, 0.21832275390625, 0.2308502197265625, 0.243377685546875, 0.2559051513671875, 0.2684326171875, 0.2809600830078125, 0.293487548828125, 0.3060150146484375, 0.31854248046875, 0.3310699462890625, 0.343597412109375, 0.3561248779296875, 0.36865234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 12.0, 5.0, 10.0, 12.0, 18.0, 37.0, 25.0, 36.0, 43.0, 65.0, 63.0, 74.0, 80.0, 64.0, 70.0, 66.0, 75.0, 59.0, 32.0, 41.0, 30.0, 16.0, 21.0, 14.0, 15.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.239013671875, -0.2313690185546875, -0.223724365234375, -0.2160797119140625, -0.20843505859375, -0.2007904052734375, -0.193145751953125, -0.1855010986328125, -0.1778564453125, -0.1702117919921875, -0.162567138671875, -0.1549224853515625, -0.14727783203125, -0.1396331787109375, -0.131988525390625, -0.1243438720703125, -0.11669921875, -0.1090545654296875, -0.101409912109375, -0.0937652587890625, -0.08612060546875, -0.0784759521484375, -0.070831298828125, -0.0631866455078125, -0.0555419921875, -0.0478973388671875, -0.040252685546875, -0.0326080322265625, -0.02496337890625, -0.0173187255859375, -0.009674072265625, -0.0020294189453125, 0.005615234375, 0.0132598876953125, 0.020904541015625, 0.0285491943359375, 0.03619384765625, 0.0438385009765625, 0.051483154296875, 0.0591278076171875, 0.0667724609375, 0.0744171142578125, 0.082061767578125, 0.0897064208984375, 0.09735107421875, 0.1049957275390625, 0.112640380859375, 0.1202850341796875, 0.1279296875, 0.1355743408203125, 0.143218994140625, 0.1508636474609375, 0.15850830078125, 0.1661529541015625, 0.173797607421875, 0.1814422607421875, 0.1890869140625, 0.1967315673828125, 0.204376220703125, 0.2120208740234375, 0.21966552734375, 0.2273101806640625, 0.234954833984375, 0.2425994873046875, 0.250244140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 7.0, 16.0, 20.0, 16.0, 33.0, 44.0, 34.0, 76.0, 87.0, 145.0, 208.0, 411.0, 783.0, 2085.0, 8423.0, 52166.0, 573892.0, 356924.0, 42392.0, 7123.0, 1879.0, 708.0, 344.0, 202.0, 150.0, 98.0, 66.0, 61.0, 31.0, 19.0, 20.0, 18.0, 17.0, 13.0, 6.0, 6.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.33544921875, -0.3230018615722656, -0.31055450439453125, -0.2981071472167969, -0.2856597900390625, -0.2732124328613281, -0.26076507568359375, -0.24831771850585938, -0.235870361328125, -0.22342300415039062, -0.21097564697265625, -0.19852828979492188, -0.1860809326171875, -0.17363357543945312, -0.16118621826171875, -0.14873886108398438, -0.13629150390625, -0.12384414672851562, -0.11139678955078125, -0.09894943237304688, -0.0865020751953125, -0.07405471801757812, -0.06160736083984375, -0.049160003662109375, -0.036712646484375, -0.024265289306640625, -0.01181793212890625, 0.000629425048828125, 0.0130767822265625, 0.025524139404296875, 0.03797149658203125, 0.050418853759765625, 0.0628662109375, 0.07531356811523438, 0.08776092529296875, 0.10020828247070312, 0.1126556396484375, 0.12510299682617188, 0.13755035400390625, 0.14999771118164062, 0.162445068359375, 0.17489242553710938, 0.18733978271484375, 0.19978713989257812, 0.2122344970703125, 0.22468185424804688, 0.23712921142578125, 0.24957656860351562, 0.26202392578125, 0.2744712829589844, 0.28691864013671875, 0.2993659973144531, 0.3118133544921875, 0.3242607116699219, 0.33670806884765625, 0.3491554260253906, 0.361602783203125, 0.3740501403808594, 0.38649749755859375, 0.3989448547363281, 0.4113922119140625, 0.4238395690917969, 0.43628692626953125, 0.4487342834472656, 0.461181640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 6.0, 5.0, 9.0, 4.0, 7.0, 6.0, 18.0, 9.0, 14.0, 15.0, 14.0, 23.0, 36.0, 29.0, 32.0, 43.0, 38.0, 47.0, 51.0, 51.0, 49.0, 49.0, 34.0, 42.0, 35.0, 35.0, 40.0, 38.0, 29.0, 29.0, 18.0, 31.0, 19.0, 19.0, 11.0, 13.0, 10.0, 7.0, 8.0, 4.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444091796875, -0.4276390075683594, -0.41118621826171875, -0.3947334289550781, -0.3782806396484375, -0.3618278503417969, -0.34537506103515625, -0.3289222717285156, -0.312469482421875, -0.2960166931152344, -0.27956390380859375, -0.2631111145019531, -0.2466583251953125, -0.23020553588867188, -0.21375274658203125, -0.19729995727539062, -0.18084716796875, -0.16439437866210938, -0.14794158935546875, -0.13148880004882812, -0.1150360107421875, -0.09858322143554688, -0.08213043212890625, -0.06567764282226562, -0.049224853515625, -0.032772064208984375, -0.01631927490234375, 0.000133514404296875, 0.0165863037109375, 0.033039093017578125, 0.04949188232421875, 0.06594467163085938, 0.0823974609375, 0.09885025024414062, 0.11530303955078125, 0.13175582885742188, 0.1482086181640625, 0.16466140747070312, 0.18111419677734375, 0.19756698608398438, 0.214019775390625, 0.23047256469726562, 0.24692535400390625, 0.2633781433105469, 0.2798309326171875, 0.2962837219238281, 0.31273651123046875, 0.3291893005371094, 0.34564208984375, 0.3620948791503906, 0.37854766845703125, 0.3950004577636719, 0.4114532470703125, 0.4279060363769531, 0.44435882568359375, 0.4608116149902344, 0.477264404296875, 0.4937171936035156, 0.5101699829101562, 0.5266227722167969, 0.5430755615234375, 0.5595283508300781, 0.5759811401367188, 0.5924339294433594, 0.60888671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 12.0, 15.0, 31.0, 44.0, 70.0, 143.0, 304.0, 997.0, 4611.0, 30459.0, 554426.0, 421533.0, 29786.0, 4446.0, 1005.0, 338.0, 143.0, 75.0, 36.0, 23.0, 13.0, 7.0, 8.0, 1.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.18947124481201172, -0.18448448181152344, -0.17949771881103516, -0.17451095581054688, -0.1695241928100586, -0.1645374298095703, -0.15955066680908203, -0.15456390380859375, -0.14957714080810547, -0.1445903778076172, -0.1396036148071289, -0.13461685180664062, -0.12963008880615234, -0.12464332580566406, -0.11965656280517578, -0.1146697998046875, -0.10968303680419922, -0.10469627380371094, -0.09970951080322266, -0.09472274780273438, -0.0897359848022461, -0.08474922180175781, -0.07976245880126953, -0.07477569580078125, -0.06978893280029297, -0.06480216979980469, -0.059815406799316406, -0.054828643798828125, -0.049841880798339844, -0.04485511779785156, -0.03986835479736328, -0.034881591796875, -0.02989482879638672, -0.024908065795898438, -0.019921302795410156, -0.014934539794921875, -0.009947776794433594, -0.0049610137939453125, 2.574920654296875e-05, 0.00501251220703125, 0.009999275207519531, 0.014986038208007812, 0.019972801208496094, 0.024959564208984375, 0.029946327209472656, 0.03493309020996094, 0.03991985321044922, 0.0449066162109375, 0.04989337921142578, 0.05488014221191406, 0.059866905212402344, 0.06485366821289062, 0.0698404312133789, 0.07482719421386719, 0.07981395721435547, 0.08480072021484375, 0.08978748321533203, 0.09477424621582031, 0.0997610092163086, 0.10474777221679688, 0.10973453521728516, 0.11472129821777344, 0.11970806121826172, 0.12469482421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 2.0, 14.0, 17.0, 29.0, 50.0, 60.0, 91.0, 125.0, 137.0, 124.0, 124.0, 70.0, 52.0, 33.0, 25.0, 9.0, 12.0, 5.0, 1.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23464584350586e-05, -6.009731441736221e-05, -5.784817039966583e-05, -5.559902638196945e-05, -5.334988236427307e-05, -5.110073834657669e-05, -4.885159432888031e-05, -4.660245031118393e-05, -4.435330629348755e-05, -4.210416227579117e-05, -3.985501825809479e-05, -3.760587424039841e-05, -3.5356730222702026e-05, -3.3107586205005646e-05, -3.0858442187309265e-05, -2.8609298169612885e-05, -2.6360154151916504e-05, -2.4111010134220123e-05, -2.1861866116523743e-05, -1.9612722098827362e-05, -1.736357808113098e-05, -1.51144340634346e-05, -1.286529004573822e-05, -1.061614602804184e-05, -8.367002010345459e-06, -6.117857992649078e-06, -3.868713974952698e-06, -1.6195699572563171e-06, 6.295740604400635e-07, 2.878718078136444e-06, 5.127862095832825e-06, 7.377006113529205e-06, 9.626150131225586e-06, 1.1875294148921967e-05, 1.4124438166618347e-05, 1.6373582184314728e-05, 1.862272620201111e-05, 2.087187021970749e-05, 2.312101423740387e-05, 2.537015825510025e-05, 2.761930227279663e-05, 2.986844629049301e-05, 3.211759030818939e-05, 3.436673432588577e-05, 3.661587834358215e-05, 3.8865022361278534e-05, 4.1114166378974915e-05, 4.3363310396671295e-05, 4.5612454414367676e-05, 4.7861598432064056e-05, 5.011074244976044e-05, 5.235988646745682e-05, 5.46090304851532e-05, 5.685817450284958e-05, 5.910731852054596e-05, 6.135646253824234e-05, 6.360560655593872e-05, 6.58547505736351e-05, 6.810389459133148e-05, 7.035303860902786e-05, 7.260218262672424e-05, 7.485132664442062e-05, 7.7100470662117e-05, 7.934961467981339e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 15.0, 16.0, 20.0, 43.0, 80.0, 130.0, 264.0, 775.0, 2737.0, 14508.0, 140450.0, 792281.0, 84067.0, 10035.0, 2004.0, 582.0, 251.0, 104.0, 68.0, 43.0, 26.0, 12.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2022705078125, -0.19738483428955078, -0.19249916076660156, -0.18761348724365234, -0.18272781372070312, -0.1778421401977539, -0.1729564666748047, -0.16807079315185547, -0.16318511962890625, -0.15829944610595703, -0.1534137725830078, -0.1485280990600586, -0.14364242553710938, -0.13875675201416016, -0.13387107849121094, -0.12898540496826172, -0.1240997314453125, -0.11921405792236328, -0.11432838439941406, -0.10944271087646484, -0.10455703735351562, -0.0996713638305664, -0.09478569030761719, -0.08990001678466797, -0.08501434326171875, -0.08012866973876953, -0.07524299621582031, -0.0703573226928711, -0.06547164916992188, -0.060585975646972656, -0.05570030212402344, -0.05081462860107422, -0.045928955078125, -0.04104328155517578, -0.03615760803222656, -0.031271934509277344, -0.026386260986328125, -0.021500587463378906, -0.016614913940429688, -0.011729240417480469, -0.00684356689453125, -0.0019578933715820312, 0.0029277801513671875, 0.007813453674316406, 0.012699127197265625, 0.017584800720214844, 0.022470474243164062, 0.02735614776611328, 0.0322418212890625, 0.03712749481201172, 0.04201316833496094, 0.046898841857910156, 0.051784515380859375, 0.056670188903808594, 0.06155586242675781, 0.06644153594970703, 0.07132720947265625, 0.07621288299560547, 0.08109855651855469, 0.0859842300415039, 0.09086990356445312, 0.09575557708740234, 0.10064125061035156, 0.10552692413330078, 0.11041259765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 8.0, 5.0, 3.0, 9.0, 14.0, 19.0, 27.0, 51.0, 56.0, 82.0, 84.0, 109.0, 133.0, 96.0, 91.0, 59.0, 32.0, 33.0, 36.0, 20.0, 11.0, 8.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.12943267822265625, -0.1248321533203125, -0.12023162841796875, -0.115631103515625, -0.11103057861328125, -0.1064300537109375, -0.10182952880859375, -0.09722900390625, -0.09262847900390625, -0.0880279541015625, -0.08342742919921875, -0.078826904296875, -0.07422637939453125, -0.0696258544921875, -0.06502532958984375, -0.0604248046875, -0.05582427978515625, -0.0512237548828125, -0.04662322998046875, -0.042022705078125, -0.03742218017578125, -0.0328216552734375, -0.02822113037109375, -0.02362060546875, -0.01902008056640625, -0.0144195556640625, -0.00981903076171875, -0.005218505859375, -0.00061798095703125, 0.0039825439453125, 0.00858306884765625, 0.01318359375, 0.01778411865234375, 0.0223846435546875, 0.02698516845703125, 0.031585693359375, 0.03618621826171875, 0.0407867431640625, 0.04538726806640625, 0.04998779296875, 0.05458831787109375, 0.0591888427734375, 0.06378936767578125, 0.068389892578125, 0.07299041748046875, 0.0775909423828125, 0.08219146728515625, 0.0867919921875, 0.09139251708984375, 0.0959930419921875, 0.10059356689453125, 0.105194091796875, 0.10979461669921875, 0.1143951416015625, 0.11899566650390625, 0.12359619140625, 0.12819671630859375, 0.1327972412109375, 0.13739776611328125, 0.141998291015625, 0.14659881591796875, 0.1511993408203125, 0.15579986572265625, 0.160400390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 5.0, 14.0, 41.0, 119.0, 313.0, 374.0, 82.0, 26.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.067654132843018, -6.907448768615723, -6.747243881225586, -6.587038516998291, -6.426833152770996, -6.266628265380859, -6.1064229011535645, -5.9462175369262695, -5.786012649536133, -5.625807285308838, -5.465602397918701, -5.305397033691406, -5.1451921463012695, -4.984986782073975, -4.82478141784668, -4.664576530456543, -4.504371166229248, -4.344165802001953, -4.183960914611816, -4.0237555503845215, -3.8635504245758057, -3.70334529876709, -3.543139934539795, -3.382934808731079, -3.2227296829223633, -3.0625245571136475, -2.9023194313049316, -2.7421140670776367, -2.581908941268921, -2.421703815460205, -2.26149845123291, -2.1012933254241943, -1.9410877227783203, -1.7808825969696045, -1.6206773519515991, -1.4604721069335938, -1.300266981124878, -1.140061855316162, -0.9798566102981567, -0.8196513652801514, -0.6594462394714355, -0.49924105405807495, -0.33903586864471436, -0.17883068323135376, -0.018625497817993164, 0.14157968759536743, 0.301784873008728, 0.4619901180267334, 0.6221952438354492, 0.7824004292488098, 0.9426056146621704, 1.1028108596801758, 1.2630159854888916, 1.4232211112976074, 1.5834263563156128, 1.7436316013336182, 1.903836727142334, 2.06404185295105, 2.2242469787597656, 2.3844523429870605, 2.5446574687957764, 2.704862594604492, 2.865067958831787, 3.025273084640503, 3.1854782104492188]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 11.0, 9.0, 7.0, 18.0, 24.0, 18.0, 12.0, 31.0, 28.0, 29.0, 35.0, 28.0, 35.0, 58.0, 62.0, 81.0, 78.0, 54.0, 42.0, 42.0, 24.0, 33.0, 27.0, 35.0, 26.0, 22.0, 16.0, 17.0, 12.0, 17.0, 10.0, 6.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9093279838562012, -1.8437790870666504, -1.7782301902770996, -1.7126811742782593, -1.6471322774887085, -1.5815833806991577, -1.5160343647003174, -1.4504854679107666, -1.3849365711212158, -1.319387674331665, -1.2538387775421143, -1.188289761543274, -1.1227408647537231, -1.0571919679641724, -0.9916430115699768, -0.9260940551757812, -0.8605451583862305, -0.7949962615966797, -0.7294473052024841, -0.6638983488082886, -0.5983494520187378, -0.532800555229187, -0.46725159883499146, -0.4017026722431183, -0.3361537456512451, -0.27060481905937195, -0.20505589246749878, -0.1395069658756256, -0.07395803928375244, -0.008409112691879272, 0.057139813899993896, 0.12268874049186707, 0.18823742866516113, 0.2537863552570343, 0.31933528184890747, 0.38488420844078064, 0.4504331350326538, 0.5159820318222046, 0.5815309882164001, 0.6470799446105957, 0.7126288414001465, 0.7781777381896973, 0.8437266945838928, 0.9092756509780884, 0.9748245477676392, 1.04037344455719, 1.1059224605560303, 1.171471357345581, 1.2370202541351318, 1.3025691509246826, 1.3681180477142334, 1.4336670637130737, 1.4992159605026245, 1.5647648572921753, 1.6303138732910156, 1.6958627700805664, 1.7614116668701172, 1.826960563659668, 1.8925094604492188, 1.958058476448059, 2.0236072540283203, 2.08915638923645, 2.154705286026001, 2.2202541828155518, 2.2858030796051025]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 10.0, 5.0, 12.0, 23.0, 35.0, 43.0, 70.0, 142.0, 250.0, 538.0, 1440.0, 4490.0, 19139.0, 192557.0, 2501049.0, 1368568.0, 89454.0, 11532.0, 3000.0, 1032.0, 395.0, 183.0, 110.0, 61.0, 33.0, 26.0, 18.0, 7.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24609375, -0.23836708068847656, -0.23064041137695312, -0.2229137420654297, -0.21518707275390625, -0.2074604034423828, -0.19973373413085938, -0.19200706481933594, -0.1842803955078125, -0.17655372619628906, -0.16882705688476562, -0.1611003875732422, -0.15337371826171875, -0.1456470489501953, -0.13792037963867188, -0.13019371032714844, -0.122467041015625, -0.11474037170410156, -0.10701370239257812, -0.09928703308105469, -0.09156036376953125, -0.08383369445800781, -0.07610702514648438, -0.06838035583496094, -0.0606536865234375, -0.05292701721191406, -0.045200347900390625, -0.03747367858886719, -0.02974700927734375, -0.022020339965820312, -0.014293670654296875, -0.0065670013427734375, 0.00115966796875, 0.008886337280273438, 0.016613006591796875, 0.024339675903320312, 0.03206634521484375, 0.03979301452636719, 0.047519683837890625, 0.05524635314941406, 0.0629730224609375, 0.07069969177246094, 0.07842636108398438, 0.08615303039550781, 0.09387969970703125, 0.10160636901855469, 0.10933303833007812, 0.11705970764160156, 0.124786376953125, 0.13251304626464844, 0.14023971557617188, 0.1479663848876953, 0.15569305419921875, 0.1634197235107422, 0.17114639282226562, 0.17887306213378906, 0.1865997314453125, 0.19432640075683594, 0.20205307006835938, 0.2097797393798828, 0.21750640869140625, 0.2252330780029297, 0.23295974731445312, 0.24068641662597656, 0.2484130859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 6.0, 13.0, 11.0, 18.0, 22.0, 32.0, 40.0, 45.0, 66.0, 55.0, 89.0, 70.0, 71.0, 68.0, 86.0, 64.0, 56.0, 29.0, 34.0, 42.0, 28.0, 13.0, 11.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.2388324737548828, -0.23120498657226562, -0.22357749938964844, -0.21595001220703125, -0.20832252502441406, -0.20069503784179688, -0.1930675506591797, -0.1854400634765625, -0.1778125762939453, -0.17018508911132812, -0.16255760192871094, -0.15493011474609375, -0.14730262756347656, -0.13967514038085938, -0.1320476531982422, -0.124420166015625, -0.11679267883300781, -0.10916519165039062, -0.10153770446777344, -0.09391021728515625, -0.08628273010253906, -0.07865524291992188, -0.07102775573730469, -0.0634002685546875, -0.05577278137207031, -0.048145294189453125, -0.04051780700683594, -0.03289031982421875, -0.025262832641601562, -0.017635345458984375, -0.010007858276367188, -0.00238037109375, 0.0052471160888671875, 0.012874603271484375, 0.020502090454101562, 0.02812957763671875, 0.03575706481933594, 0.043384552001953125, 0.05101203918457031, 0.0586395263671875, 0.06626701354980469, 0.07389450073242188, 0.08152198791503906, 0.08914947509765625, 0.09677696228027344, 0.10440444946289062, 0.11203193664550781, 0.119659423828125, 0.1272869110107422, 0.13491439819335938, 0.14254188537597656, 0.15016937255859375, 0.15779685974121094, 0.16542434692382812, 0.1730518341064453, 0.1806793212890625, 0.1883068084716797, 0.19593429565429688, 0.20356178283691406, 0.21118927001953125, 0.21881675720214844, 0.22644424438476562, 0.2340717315673828, 0.24169921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 14.0, 22.0, 35.0, 44.0, 63.0, 107.0, 195.0, 393.0, 851.0, 2787.0, 11995.0, 98028.0, 2926017.0, 1096862.0, 45979.0, 7392.0, 1981.0, 699.0, 344.0, 153.0, 89.0, 61.0, 42.0, 28.0, 20.0, 17.0, 7.0, 9.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2646484375, -0.2554740905761719, -0.24629974365234375, -0.23712539672851562, -0.2279510498046875, -0.21877670288085938, -0.20960235595703125, -0.20042800903320312, -0.191253662109375, -0.18207931518554688, -0.17290496826171875, -0.16373062133789062, -0.1545562744140625, -0.14538192749023438, -0.13620758056640625, -0.12703323364257812, -0.11785888671875, -0.10868453979492188, -0.09951019287109375, -0.09033584594726562, -0.0811614990234375, -0.07198715209960938, -0.06281280517578125, -0.053638458251953125, -0.044464111328125, -0.035289764404296875, -0.02611541748046875, -0.016941070556640625, -0.0077667236328125, 0.001407623291015625, 0.01058197021484375, 0.019756317138671875, 0.0289306640625, 0.038105010986328125, 0.04727935791015625, 0.056453704833984375, 0.0656280517578125, 0.07480239868164062, 0.08397674560546875, 0.09315109252929688, 0.102325439453125, 0.11149978637695312, 0.12067413330078125, 0.12984848022460938, 0.1390228271484375, 0.14819717407226562, 0.15737152099609375, 0.16654586791992188, 0.17572021484375, 0.18489456176757812, 0.19406890869140625, 0.20324325561523438, 0.2124176025390625, 0.22159194946289062, 0.23076629638671875, 0.23994064331054688, 0.249114990234375, 0.2582893371582031, 0.26746368408203125, 0.2766380310058594, 0.2858123779296875, 0.2949867248535156, 0.30416107177734375, 0.3133354187011719, 0.322509765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 9.0, 6.0, 10.0, 18.0, 17.0, 28.0, 40.0, 77.0, 105.0, 165.0, 293.0, 426.0, 620.0, 650.0, 567.0, 389.0, 226.0, 140.0, 89.0, 54.0, 27.0, 35.0, 19.0, 18.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.2312297821044922, -0.22307968139648438, -0.21492958068847656, -0.20677947998046875, -0.19862937927246094, -0.19047927856445312, -0.1823291778564453, -0.1741790771484375, -0.1660289764404297, -0.15787887573242188, -0.14972877502441406, -0.14157867431640625, -0.13342857360839844, -0.12527847290039062, -0.11712837219238281, -0.108978271484375, -0.10082817077636719, -0.09267807006835938, -0.08452796936035156, -0.07637786865234375, -0.06822776794433594, -0.060077667236328125, -0.05192756652832031, -0.0437774658203125, -0.03562736511230469, -0.027477264404296875, -0.019327163696289062, -0.01117706298828125, -0.0030269622802734375, 0.005123138427734375, 0.013273239135742188, 0.02142333984375, 0.029573440551757812, 0.037723541259765625, 0.04587364196777344, 0.05402374267578125, 0.06217384338378906, 0.07032394409179688, 0.07847404479980469, 0.0866241455078125, 0.09477424621582031, 0.10292434692382812, 0.11107444763183594, 0.11922454833984375, 0.12737464904785156, 0.13552474975585938, 0.1436748504638672, 0.151824951171875, 0.1599750518798828, 0.16812515258789062, 0.17627525329589844, 0.18442535400390625, 0.19257545471191406, 0.20072555541992188, 0.2088756561279297, 0.2170257568359375, 0.2251758575439453, 0.23332595825195312, 0.24147605895996094, 0.24962615966796875, 0.25777626037597656, 0.2659263610839844, 0.2740764617919922, 0.2822265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 17.0, 18.0, 32.0, 66.0, 111.0, 146.0, 175.0, 161.0, 109.0, 83.0, 34.0, 18.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3326082229614258, -1.2683184146881104, -1.204028606414795, -1.1397387981414795, -1.075448989868164, -1.0111591815948486, -0.9468694925308228, -0.8825796842575073, -0.8182898759841919, -0.7540000677108765, -0.689710259437561, -0.6254205107688904, -0.561130702495575, -0.4968408942222595, -0.4325511157512665, -0.36826133728027344, -0.303971529006958, -0.23968173563480377, -0.17539194226264954, -0.1111021488904953, -0.046812355518341064, 0.017477452754974365, 0.08176723122596741, 0.14605700969696045, 0.21034681797027588, 0.2746366262435913, 0.33892640471458435, 0.4032161831855774, 0.4675059914588928, 0.5317957997322083, 0.5960855484008789, 0.6603753566741943, 0.7246651649475098, 0.7889549732208252, 0.8532447814941406, 0.9175345301628113, 0.9818243384361267, 1.046114206314087, 1.1104038953781128, 1.1746937036514282, 1.2389835119247437, 1.303273320198059, 1.3675631284713745, 1.43185293674469, 1.4961426258087158, 1.5604324340820312, 1.6247222423553467, 1.689012050628662, 1.7533018589019775, 1.817591667175293, 1.8818814754486084, 1.9461712837219238, 2.0104610919952393, 2.0747509002685547, 2.13904070854187, 2.2033305168151855, 2.267620086669922, 2.3319098949432373, 2.3961997032165527, 2.460489511489868, 2.5247793197631836, 2.589069128036499, 2.6533589363098145, 2.717648506164551, 2.7819385528564453]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 6.0, 6.0, 13.0, 14.0, 20.0, 16.0, 23.0, 28.0, 30.0, 32.0, 49.0, 51.0, 47.0, 49.0, 66.0, 62.0, 60.0, 50.0, 60.0, 41.0, 37.0, 38.0, 43.0, 39.0, 28.0, 21.0, 17.0, 18.0, 13.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.6954822540283203, -1.6533327102661133, -1.6111831665039062, -1.5690336227416992, -1.5268839597702026, -1.4847344160079956, -1.4425848722457886, -1.4004353284835815, -1.358285665512085, -1.316136121749878, -1.273986577987671, -1.2318370342254639, -1.1896873712539673, -1.1475378274917603, -1.1053882837295532, -1.0632387399673462, -1.0210891962051392, -0.9789396524429321, -0.9367900490760803, -0.8946405053138733, -0.8524909019470215, -0.8103413581848145, -0.7681918144226074, -0.7260422706604004, -0.6838926672935486, -0.6417431235313416, -0.5995935201644897, -0.5574439764022827, -0.5152944326400757, -0.4731448292732239, -0.43099528551101685, -0.3888457119464874, -0.346696138381958, -0.3045465648174286, -0.26239699125289917, -0.22024744749069214, -0.17809787392616272, -0.1359483003616333, -0.09379875659942627, -0.05164918303489685, -0.009499609470367432, 0.03264995664358139, 0.07479952275753021, 0.11694908142089844, 0.15909865498542786, 0.20124822854995728, 0.2433977723121643, 0.2855473458766937, 0.32769691944122314, 0.36984649300575256, 0.411996066570282, 0.454145610332489, 0.49629518389701843, 0.5384447574615479, 0.5805943012237549, 0.6227438449859619, 0.6648934483528137, 0.7070429921150208, 0.7491925954818726, 0.7913421392440796, 0.8334916830062866, 0.8756412863731384, 0.9177908301353455, 0.9599404335021973, 1.0020899772644043]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 15.0, 23.0, 35.0, 42.0, 107.0, 151.0, 298.0, 597.0, 1639.0, 5855.0, 30378.0, 218258.0, 632949.0, 131852.0, 19857.0, 4093.0, 1249.0, 514.0, 276.0, 156.0, 70.0, 50.0, 28.0, 17.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3946685791015625, -0.383819580078125, -0.3729705810546875, -0.36212158203125, -0.3512725830078125, -0.340423583984375, -0.3295745849609375, -0.3187255859375, -0.3078765869140625, -0.297027587890625, -0.2861785888671875, -0.27532958984375, -0.2644805908203125, -0.253631591796875, -0.2427825927734375, -0.23193359375, -0.2210845947265625, -0.210235595703125, -0.1993865966796875, -0.18853759765625, -0.1776885986328125, -0.166839599609375, -0.1559906005859375, -0.1451416015625, -0.1342926025390625, -0.123443603515625, -0.1125946044921875, -0.10174560546875, -0.0908966064453125, -0.080047607421875, -0.0691986083984375, -0.058349609375, -0.0475006103515625, -0.036651611328125, -0.0258026123046875, -0.01495361328125, -0.0041046142578125, 0.006744384765625, 0.0175933837890625, 0.0284423828125, 0.0392913818359375, 0.050140380859375, 0.0609893798828125, 0.07183837890625, 0.0826873779296875, 0.093536376953125, 0.1043853759765625, 0.115234375, 0.1260833740234375, 0.136932373046875, 0.1477813720703125, 0.15863037109375, 0.1694793701171875, 0.180328369140625, 0.1911773681640625, 0.2020263671875, 0.2128753662109375, 0.223724365234375, 0.2345733642578125, 0.24542236328125, 0.2562713623046875, 0.267120361328125, 0.2779693603515625, 0.288818359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 10.0, 16.0, 16.0, 24.0, 36.0, 41.0, 56.0, 51.0, 64.0, 74.0, 77.0, 84.0, 63.0, 73.0, 69.0, 53.0, 32.0, 37.0, 32.0, 28.0, 25.0, 13.0, 3.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2481689453125, -0.2405071258544922, -0.23284530639648438, -0.22518348693847656, -0.21752166748046875, -0.20985984802246094, -0.20219802856445312, -0.1945362091064453, -0.1868743896484375, -0.1792125701904297, -0.17155075073242188, -0.16388893127441406, -0.15622711181640625, -0.14856529235839844, -0.14090347290039062, -0.1332416534423828, -0.125579833984375, -0.11791801452636719, -0.11025619506835938, -0.10259437561035156, -0.09493255615234375, -0.08727073669433594, -0.07960891723632812, -0.07194709777832031, -0.0642852783203125, -0.05662345886230469, -0.048961639404296875, -0.04129981994628906, -0.03363800048828125, -0.025976181030273438, -0.018314361572265625, -0.010652542114257812, -0.00299072265625, 0.0046710968017578125, 0.012332916259765625, 0.019994735717773438, 0.02765655517578125, 0.03531837463378906, 0.042980194091796875, 0.05064201354980469, 0.0583038330078125, 0.06596565246582031, 0.07362747192382812, 0.08128929138183594, 0.08895111083984375, 0.09661293029785156, 0.10427474975585938, 0.11193656921386719, 0.119598388671875, 0.1272602081298828, 0.13492202758789062, 0.14258384704589844, 0.15024566650390625, 0.15790748596191406, 0.16556930541992188, 0.1732311248779297, 0.1808929443359375, 0.1885547637939453, 0.19621658325195312, 0.20387840270996094, 0.21154022216796875, 0.21920204162597656, 0.22686386108398438, 0.2345256805419922, 0.2421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 13.0, 12.0, 27.0, 32.0, 40.0, 60.0, 73.0, 83.0, 139.0, 182.0, 260.0, 379.0, 664.0, 1171.0, 3018.0, 14622.0, 134781.0, 787043.0, 89598.0, 10775.0, 2605.0, 1056.0, 569.0, 407.0, 282.0, 166.0, 117.0, 82.0, 62.0, 68.0, 34.0, 27.0, 25.0, 17.0, 13.0, 9.0, 6.0, 3.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.415283203125, -0.40247344970703125, -0.3896636962890625, -0.37685394287109375, -0.364044189453125, -0.35123443603515625, -0.3384246826171875, -0.32561492919921875, -0.31280517578125, -0.29999542236328125, -0.2871856689453125, -0.27437591552734375, -0.261566162109375, -0.24875640869140625, -0.2359466552734375, -0.22313690185546875, -0.2103271484375, -0.19751739501953125, -0.1847076416015625, -0.17189788818359375, -0.159088134765625, -0.14627838134765625, -0.1334686279296875, -0.12065887451171875, -0.10784912109375, -0.09503936767578125, -0.0822296142578125, -0.06941986083984375, -0.056610107421875, -0.04380035400390625, -0.0309906005859375, -0.01818084716796875, -0.00537109375, 0.00743865966796875, 0.0202484130859375, 0.03305816650390625, 0.045867919921875, 0.05867767333984375, 0.0714874267578125, 0.08429718017578125, 0.09710693359375, 0.10991668701171875, 0.1227264404296875, 0.13553619384765625, 0.148345947265625, 0.16115570068359375, 0.1739654541015625, 0.18677520751953125, 0.1995849609375, 0.21239471435546875, 0.2252044677734375, 0.23801422119140625, 0.250823974609375, 0.26363372802734375, 0.2764434814453125, 0.28925323486328125, 0.30206298828125, 0.31487274169921875, 0.3276824951171875, 0.34049224853515625, 0.353302001953125, 0.36611175537109375, 0.3789215087890625, 0.39173126220703125, 0.404541015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 1.0, 3.0, 4.0, 15.0, 5.0, 12.0, 15.0, 15.0, 21.0, 41.0, 22.0, 39.0, 42.0, 57.0, 43.0, 58.0, 66.0, 67.0, 71.0, 63.0, 53.0, 41.0, 40.0, 36.0, 29.0, 35.0, 37.0, 16.0, 9.0, 7.0, 11.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.625, -0.6049728393554688, -0.5849456787109375, -0.5649185180664062, -0.544891357421875, -0.5248641967773438, -0.5048370361328125, -0.48480987548828125, -0.46478271484375, -0.44475555419921875, -0.4247283935546875, -0.40470123291015625, -0.384674072265625, -0.36464691162109375, -0.3446197509765625, -0.32459259033203125, -0.3045654296875, -0.28453826904296875, -0.2645111083984375, -0.24448394775390625, -0.224456787109375, -0.20442962646484375, -0.1844024658203125, -0.16437530517578125, -0.14434814453125, -0.12432098388671875, -0.1042938232421875, -0.08426666259765625, -0.064239501953125, -0.04421234130859375, -0.0241851806640625, -0.00415802001953125, 0.015869140625, 0.03589630126953125, 0.0559234619140625, 0.07595062255859375, 0.095977783203125, 0.11600494384765625, 0.1360321044921875, 0.15605926513671875, 0.17608642578125, 0.19611358642578125, 0.2161407470703125, 0.23616790771484375, 0.256195068359375, 0.27622222900390625, 0.2962493896484375, 0.31627655029296875, 0.3363037109375, 0.35633087158203125, 0.3763580322265625, 0.39638519287109375, 0.416412353515625, 0.43643951416015625, 0.4564666748046875, 0.47649383544921875, 0.49652099609375, 0.5165481567382812, 0.5365753173828125, 0.5566024780273438, 0.576629638671875, 0.5966567993164062, 0.6166839599609375, 0.6367111206054688, 0.65673828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 16.0, 28.0, 44.0, 62.0, 163.0, 287.0, 821.0, 2963.0, 16922.0, 191790.0, 786343.0, 41169.0, 5681.0, 1324.0, 463.0, 207.0, 98.0, 62.0, 30.0, 15.0, 15.0, 8.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.18938350677490234, -0.1845531463623047, -0.17972278594970703, -0.17489242553710938, -0.17006206512451172, -0.16523170471191406, -0.1604013442993164, -0.15557098388671875, -0.1507406234741211, -0.14591026306152344, -0.14107990264892578, -0.13624954223632812, -0.13141918182373047, -0.1265888214111328, -0.12175846099853516, -0.1169281005859375, -0.11209774017333984, -0.10726737976074219, -0.10243701934814453, -0.09760665893554688, -0.09277629852294922, -0.08794593811035156, -0.0831155776977539, -0.07828521728515625, -0.0734548568725586, -0.06862449645996094, -0.06379413604736328, -0.058963775634765625, -0.05413341522216797, -0.04930305480957031, -0.044472694396972656, -0.039642333984375, -0.034811973571777344, -0.029981613159179688, -0.02515125274658203, -0.020320892333984375, -0.015490531921386719, -0.010660171508789062, -0.005829811096191406, -0.00099945068359375, 0.0038309097290039062, 0.008661270141601562, 0.013491630554199219, 0.018321990966796875, 0.02315235137939453, 0.027982711791992188, 0.032813072204589844, 0.0376434326171875, 0.042473793029785156, 0.04730415344238281, 0.05213451385498047, 0.056964874267578125, 0.06179523468017578, 0.06662559509277344, 0.0714559555053711, 0.07628631591796875, 0.0811166763305664, 0.08594703674316406, 0.09077739715576172, 0.09560775756835938, 0.10043811798095703, 0.10526847839355469, 0.11009883880615234, 0.11492919921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 2.0, 14.0, 11.0, 13.0, 21.0, 23.0, 26.0, 61.0, 86.0, 95.0, 84.0, 115.0, 89.0, 68.0, 64.0, 48.0, 51.0, 23.0, 20.0, 19.0, 19.0, 7.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.235709249973297e-05, -5.083158612251282e-05, -4.9306079745292664e-05, -4.778057336807251e-05, -4.6255066990852356e-05, -4.47295606136322e-05, -4.320405423641205e-05, -4.1678547859191895e-05, -4.015304148197174e-05, -3.862753510475159e-05, -3.710202872753143e-05, -3.557652235031128e-05, -3.4051015973091125e-05, -3.252550959587097e-05, -3.100000321865082e-05, -2.9474496841430664e-05, -2.794899046421051e-05, -2.6423484086990356e-05, -2.4897977709770203e-05, -2.337247133255005e-05, -2.1846964955329895e-05, -2.032145857810974e-05, -1.8795952200889587e-05, -1.7270445823669434e-05, -1.574493944644928e-05, -1.4219433069229126e-05, -1.2693926692008972e-05, -1.1168420314788818e-05, -9.642913937568665e-06, -8.11740756034851e-06, -6.591901183128357e-06, -5.066394805908203e-06, -3.5408884286880493e-06, -2.0153820514678955e-06, -4.898756742477417e-07, 1.0356307029724121e-06, 2.561137080192566e-06, 4.08664345741272e-06, 5.6121498346328735e-06, 7.137656211853027e-06, 8.663162589073181e-06, 1.0188668966293335e-05, 1.1714175343513489e-05, 1.3239681720733643e-05, 1.4765188097953796e-05, 1.629069447517395e-05, 1.7816200852394104e-05, 1.9341707229614258e-05, 2.086721360683441e-05, 2.2392719984054565e-05, 2.391822636127472e-05, 2.5443732738494873e-05, 2.6969239115715027e-05, 2.849474549293518e-05, 3.0020251870155334e-05, 3.154575824737549e-05, 3.307126462459564e-05, 3.4596771001815796e-05, 3.612227737903595e-05, 3.7647783756256104e-05, 3.917329013347626e-05, 4.069879651069641e-05, 4.2224302887916565e-05, 4.374980926513672e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 11.0, 3.0, 3.0, 15.0, 9.0, 23.0, 24.0, 32.0, 43.0, 74.0, 105.0, 152.0, 214.0, 368.0, 639.0, 1365.0, 3134.0, 8486.0, 28872.0, 125412.0, 687716.0, 143615.0, 32135.0, 9405.0, 3405.0, 1445.0, 713.0, 379.0, 233.0, 155.0, 93.0, 70.0, 62.0, 38.0, 30.0, 22.0, 12.0, 11.0, 10.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836181640625, -0.08096694946289062, -0.07831573486328125, -0.07566452026367188, -0.0730133056640625, -0.07036209106445312, -0.06771087646484375, -0.06505966186523438, -0.062408447265625, -0.059757232666015625, -0.05710601806640625, -0.054454803466796875, -0.0518035888671875, -0.049152374267578125, -0.04650115966796875, -0.043849945068359375, -0.04119873046875, -0.038547515869140625, -0.03589630126953125, -0.033245086669921875, -0.0305938720703125, -0.027942657470703125, -0.02529144287109375, -0.022640228271484375, -0.019989013671875, -0.017337799072265625, -0.01468658447265625, -0.012035369873046875, -0.0093841552734375, -0.006732940673828125, -0.00408172607421875, -0.001430511474609375, 0.001220703125, 0.003871917724609375, 0.00652313232421875, 0.009174346923828125, 0.0118255615234375, 0.014476776123046875, 0.01712799072265625, 0.019779205322265625, 0.022430419921875, 0.025081634521484375, 0.02773284912109375, 0.030384063720703125, 0.0330352783203125, 0.035686492919921875, 0.03833770751953125, 0.040988922119140625, 0.04364013671875, 0.046291351318359375, 0.04894256591796875, 0.051593780517578125, 0.0542449951171875, 0.056896209716796875, 0.05954742431640625, 0.062198638916015625, 0.064849853515625, 0.06750106811523438, 0.07015228271484375, 0.07280349731445312, 0.0754547119140625, 0.07810592651367188, 0.08075714111328125, 0.08340835571289062, 0.0860595703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 11.0, 12.0, 19.0, 17.0, 21.0, 21.0, 43.0, 56.0, 77.0, 91.0, 100.0, 98.0, 98.0, 72.0, 49.0, 42.0, 40.0, 27.0, 25.0, 18.0, 8.0, 10.0, 3.0, 3.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.09019088745117188, -0.08718109130859375, -0.08417129516601562, -0.0811614990234375, -0.07815170288085938, -0.07514190673828125, -0.07213211059570312, -0.069122314453125, -0.06611251831054688, -0.06310272216796875, -0.060092926025390625, -0.0570831298828125, -0.054073333740234375, -0.05106353759765625, -0.048053741455078125, -0.0450439453125, -0.042034149169921875, -0.03902435302734375, -0.036014556884765625, -0.0330047607421875, -0.029994964599609375, -0.02698516845703125, -0.023975372314453125, -0.020965576171875, -0.017955780029296875, -0.01494598388671875, -0.011936187744140625, -0.0089263916015625, -0.005916595458984375, -0.00290679931640625, 0.000102996826171875, 0.00311279296875, 0.006122589111328125, 0.00913238525390625, 0.012142181396484375, 0.0151519775390625, 0.018161773681640625, 0.02117156982421875, 0.024181365966796875, 0.027191162109375, 0.030200958251953125, 0.03321075439453125, 0.036220550537109375, 0.0392303466796875, 0.042240142822265625, 0.04524993896484375, 0.048259735107421875, 0.05126953125, 0.054279327392578125, 0.05728912353515625, 0.060298919677734375, 0.0633087158203125, 0.06631851196289062, 0.06932830810546875, 0.07233810424804688, 0.075347900390625, 0.07835769653320312, 0.08136749267578125, 0.08437728881835938, 0.0873870849609375, 0.09039688110351562, 0.09340667724609375, 0.09641647338867188, 0.09942626953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 29.0, 133.0, 494.0, 239.0, 58.0, 15.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.761096477508545, -7.583735466003418, -7.406374931335449, -7.229013919830322, -7.051652908325195, -6.874292373657227, -6.6969313621521, -6.519570350646973, -6.342209815979004, -6.164848804473877, -5.987488269805908, -5.810127258300781, -5.6327667236328125, -5.4554057121276855, -5.278044700622559, -5.10068416595459, -4.923323154449463, -4.745962142944336, -4.568601608276367, -4.39124059677124, -4.213879585266113, -4.0365190505981445, -3.8591580390930176, -3.6817972660064697, -3.504436492919922, -3.327075719833374, -3.149714946746826, -2.972353935241699, -2.7949931621551514, -2.6176323890686035, -2.4402713775634766, -2.2629106044769287, -2.085550308227539, -1.9081895351409912, -1.7308286428451538, -1.5534677505493164, -1.3761069774627686, -1.1987462043762207, -1.0213853120803833, -0.8440244197845459, -0.666663646697998, -0.4893028140068054, -0.3119419813156128, -0.13458114862442017, 0.04277968406677246, 0.2201405167579651, 0.3975013494491577, 0.5748622417449951, 0.752223014831543, 0.9295838475227356, 1.1069446802139282, 1.2843055725097656, 1.4616663455963135, 1.6390271186828613, 1.8163880109786987, 1.9937489032745361, 2.171109676361084, 2.348470449447632, 2.5258312225341797, 2.7031922340393066, 2.8805530071258545, 3.0579137802124023, 3.2352747917175293, 3.412635564804077, 3.589996337890625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 3.0, 5.0, 5.0, 7.0, 10.0, 10.0, 14.0, 11.0, 18.0, 19.0, 13.0, 24.0, 31.0, 29.0, 32.0, 39.0, 52.0, 56.0, 99.0, 83.0, 72.0, 47.0, 34.0, 33.0, 29.0, 26.0, 24.0, 14.0, 23.0, 16.0, 16.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6487575769424438, -1.5938482284545898, -1.5389389991760254, -1.4840296506881714, -1.4291203022003174, -1.374211072921753, -1.319301724433899, -1.264392375946045, -1.2094831466674805, -1.1545737981796265, -1.099664568901062, -1.044755220413208, -0.9898459315299988, -0.9349366426467896, -0.8800272941589355, -0.8251180052757263, -0.7702087163925171, -0.7152994275093079, -0.6603901386260986, -0.6054807901382446, -0.5505715012550354, -0.49566221237182617, -0.44075289368629456, -0.38584357500076294, -0.3309342861175537, -0.2760249972343445, -0.22111567854881287, -0.16620637476444244, -0.11129707098007202, -0.05638778209686279, -0.0014784634113311768, 0.05343085527420044, 0.10834002494812012, 0.16324932873249054, 0.21815863251686096, 0.2730679512023926, 0.3279772400856018, 0.38288652896881104, 0.43779584765434265, 0.49270516633987427, 0.5476144552230835, 0.6025237441062927, 0.657433032989502, 0.712342381477356, 0.7672516703605652, 0.8221609592437744, 0.8770703077316284, 0.9319795966148376, 0.9868888854980469, 1.0417982339859009, 1.0967074632644653, 1.1516168117523193, 1.2065260410308838, 1.2614353895187378, 1.3163447380065918, 1.3712539672851562, 1.4261633157730103, 1.4810726642608643, 1.5359818935394287, 1.5908912420272827, 1.6458005905151367, 1.7007098197937012, 1.7556191682815552, 1.8105285167694092, 1.8654377460479736]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 2.0, 3.0, 10.0, 14.0, 14.0, 25.0, 39.0, 59.0, 104.0, 194.0, 464.0, 1032.0, 3548.0, 19709.0, 313356.0, 3271640.0, 550302.0, 26952.0, 4550.0, 1224.0, 463.0, 243.0, 122.0, 73.0, 35.0, 30.0, 26.0, 7.0, 13.0, 8.0, 6.0, 3.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.25140380859375, -0.2415771484375, -0.23175048828125, -0.221923828125, -0.21209716796875, -0.2022705078125, -0.19244384765625, -0.1826171875, -0.17279052734375, -0.1629638671875, -0.15313720703125, -0.143310546875, -0.13348388671875, -0.1236572265625, -0.11383056640625, -0.10400390625, -0.09417724609375, -0.0843505859375, -0.07452392578125, -0.064697265625, -0.05487060546875, -0.0450439453125, -0.03521728515625, -0.025390625, -0.01556396484375, -0.0057373046875, 0.00408935546875, 0.013916015625, 0.02374267578125, 0.0335693359375, 0.04339599609375, 0.05322265625, 0.06304931640625, 0.0728759765625, 0.08270263671875, 0.092529296875, 0.10235595703125, 0.1121826171875, 0.12200927734375, 0.1318359375, 0.14166259765625, 0.1514892578125, 0.16131591796875, 0.171142578125, 0.18096923828125, 0.1907958984375, 0.20062255859375, 0.21044921875, 0.22027587890625, 0.2301025390625, 0.23992919921875, 0.249755859375, 0.25958251953125, 0.2694091796875, 0.27923583984375, 0.2890625, 0.29888916015625, 0.3087158203125, 0.31854248046875, 0.328369140625, 0.33819580078125, 0.3480224609375, 0.35784912109375, 0.36767578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 7.0, 9.0, 14.0, 30.0, 30.0, 50.0, 62.0, 62.0, 66.0, 76.0, 89.0, 72.0, 61.0, 73.0, 81.0, 46.0, 42.0, 30.0, 29.0, 17.0, 19.0, 10.0, 8.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24883651733398438, -0.24108123779296875, -0.23332595825195312, -0.2255706787109375, -0.21781539916992188, -0.21006011962890625, -0.20230484008789062, -0.194549560546875, -0.18679428100585938, -0.17903900146484375, -0.17128372192382812, -0.1635284423828125, -0.15577316284179688, -0.14801788330078125, -0.14026260375976562, -0.13250732421875, -0.12475204467773438, -0.11699676513671875, -0.10924148559570312, -0.1014862060546875, -0.09373092651367188, -0.08597564697265625, -0.07822036743164062, -0.070465087890625, -0.06270980834960938, -0.05495452880859375, -0.047199249267578125, -0.0394439697265625, -0.031688690185546875, -0.02393341064453125, -0.016178131103515625, -0.0084228515625, -0.000667572021484375, 0.00708770751953125, 0.014842987060546875, 0.0225982666015625, 0.030353546142578125, 0.03810882568359375, 0.045864105224609375, 0.053619384765625, 0.061374664306640625, 0.06912994384765625, 0.07688522338867188, 0.0846405029296875, 0.09239578247070312, 0.10015106201171875, 0.10790634155273438, 0.11566162109375, 0.12341690063476562, 0.13117218017578125, 0.13892745971679688, 0.1466827392578125, 0.15443801879882812, 0.16219329833984375, 0.16994857788085938, 0.177703857421875, 0.18545913696289062, 0.19321441650390625, 0.20096969604492188, 0.2087249755859375, 0.21648025512695312, 0.22423553466796875, 0.23199081420898438, 0.23974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 12.0, 10.0, 20.0, 18.0, 41.0, 66.0, 110.0, 235.0, 479.0, 1212.0, 4839.0, 40969.0, 2280726.0, 1823874.0, 35341.0, 4308.0, 1067.0, 439.0, 207.0, 101.0, 74.0, 35.0, 33.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330810546875, -0.3189849853515625, -0.307159423828125, -0.2953338623046875, -0.28350830078125, -0.2716827392578125, -0.259857177734375, -0.2480316162109375, -0.2362060546875, -0.2243804931640625, -0.212554931640625, -0.2007293701171875, -0.18890380859375, -0.1770782470703125, -0.165252685546875, -0.1534271240234375, -0.1416015625, -0.1297760009765625, -0.117950439453125, -0.1061248779296875, -0.09429931640625, -0.0824737548828125, -0.070648193359375, -0.0588226318359375, -0.0469970703125, -0.0351715087890625, -0.023345947265625, -0.0115203857421875, 0.00030517578125, 0.0121307373046875, 0.023956298828125, 0.0357818603515625, 0.047607421875, 0.0594329833984375, 0.071258544921875, 0.0830841064453125, 0.09490966796875, 0.1067352294921875, 0.118560791015625, 0.1303863525390625, 0.1422119140625, 0.1540374755859375, 0.165863037109375, 0.1776885986328125, 0.18951416015625, 0.2013397216796875, 0.213165283203125, 0.2249908447265625, 0.23681640625, 0.2486419677734375, 0.260467529296875, 0.2722930908203125, 0.28411865234375, 0.2959442138671875, 0.307769775390625, 0.3195953369140625, 0.3314208984375, 0.3432464599609375, 0.355072021484375, 0.3668975830078125, 0.37872314453125, 0.3905487060546875, 0.402374267578125, 0.4141998291015625, 0.426025390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 4.0, 6.0, 18.0, 17.0, 25.0, 31.0, 42.0, 56.0, 72.0, 131.0, 239.0, 371.0, 460.0, 594.0, 543.0, 462.0, 342.0, 207.0, 150.0, 94.0, 54.0, 25.0, 29.0, 30.0, 22.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238525390625, -0.23054885864257812, -0.22257232666015625, -0.21459579467773438, -0.2066192626953125, -0.19864273071289062, -0.19066619873046875, -0.18268966674804688, -0.174713134765625, -0.16673660278320312, -0.15876007080078125, -0.15078353881835938, -0.1428070068359375, -0.13483047485351562, -0.12685394287109375, -0.11887741088867188, -0.11090087890625, -0.10292434692382812, -0.09494781494140625, -0.08697128295898438, -0.0789947509765625, -0.07101821899414062, -0.06304168701171875, -0.055065155029296875, -0.047088623046875, -0.039112091064453125, -0.03113555908203125, -0.023159027099609375, -0.0151824951171875, -0.007205963134765625, 0.00077056884765625, 0.008747100830078125, 0.0167236328125, 0.024700164794921875, 0.03267669677734375, 0.040653228759765625, 0.0486297607421875, 0.056606292724609375, 0.06458282470703125, 0.07255935668945312, 0.080535888671875, 0.08851242065429688, 0.09648895263671875, 0.10446548461914062, 0.1124420166015625, 0.12041854858398438, 0.12839508056640625, 0.13637161254882812, 0.14434814453125, 0.15232467651367188, 0.16030120849609375, 0.16827774047851562, 0.1762542724609375, 0.18423080444335938, 0.19220733642578125, 0.20018386840820312, 0.208160400390625, 0.21613693237304688, 0.22411346435546875, 0.23208999633789062, 0.2400665283203125, 0.24804306030273438, 0.25601959228515625, 0.2639961242675781, 0.27197265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 11.0, 12.0, 62.0, 142.0, 282.0, 255.0, 138.0, 63.0, 21.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2180449962615967, -3.0988314151763916, -2.9796178340911865, -2.8604042530059814, -2.7411906719207764, -2.6219770908355713, -2.502763271331787, -2.383549690246582, -2.264336109161377, -2.145122528076172, -2.025908946990967, -1.9066953659057617, -1.7874817848205566, -1.6682682037353516, -1.549054503440857, -1.4298409223556519, -1.3106274604797363, -1.1914138793945312, -1.0722002983093262, -0.9529866576194763, -0.8337730765342712, -0.7145594954490662, -0.5953458547592163, -0.47613227367401123, -0.35691869258880615, -0.23770509660243988, -0.11849150061607361, 0.0007221102714538574, 0.11993569135665894, 0.239149272441864, 0.35836291313171387, 0.47757649421691895, 0.5967898368835449, 0.71600341796875, 0.8352169990539551, 0.9544306397438049, 1.0736441612243652, 1.1928577423095703, 1.312071442604065, 1.43128502368927, 1.550498604774475, 1.6697121858596802, 1.7889257669448853, 1.9081394672393799, 2.027353048324585, 2.14656662940979, 2.265780210494995, 2.3849937915802, 2.5042073726654053, 2.6234209537506104, 2.7426345348358154, 2.8618481159210205, 2.9810616970062256, 3.1002752780914307, 3.219489097595215, 3.33870267868042, 3.457916259765625, 3.57712984085083, 3.696343421936035, 3.8155570030212402, 3.9347705841064453, 4.05398416519165, 4.1731977462768555, 4.2924113273620605, 4.411624908447266]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 10.0, 12.0, 8.0, 14.0, 19.0, 26.0, 21.0, 33.0, 44.0, 29.0, 46.0, 60.0, 54.0, 72.0, 73.0, 74.0, 63.0, 53.0, 36.0, 58.0, 27.0, 28.0, 26.0, 21.0, 17.0, 14.0, 12.0, 10.0, 9.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88785982131958, -1.8361716270446777, -1.784483551979065, -1.7327953577041626, -1.6811072826385498, -1.6294190883636475, -1.5777310132980347, -1.5260428190231323, -1.4743547439575195, -1.4226665496826172, -1.3709784746170044, -1.319290280342102, -1.2676022052764893, -1.215914011001587, -1.1642259359359741, -1.1125377416610718, -1.060849666595459, -1.0091614723205566, -0.9574733972549438, -0.9057852625846863, -0.8540971279144287, -0.8024089336395264, -0.7507208585739136, -0.6990326642990112, -0.6473444700241089, -0.5956563353538513, -0.5439682006835938, -0.4922800660133362, -0.4405919313430786, -0.38890376687049866, -0.3372156322002411, -0.2855274975299835, -0.23383939266204834, -0.18215125799179077, -0.1304631233215332, -0.07877497375011444, -0.027086839079856873, 0.02460131049156189, 0.07628944516181946, 0.12797757983207703, 0.1796657145023346, 0.23135384917259216, 0.28304198384284973, 0.3347301483154297, 0.38641828298568726, 0.4381064176559448, 0.4897945523262024, 0.54148268699646, 0.5931708216667175, 0.6448589563369751, 0.6965470910072327, 0.7482352256774902, 0.7999233603477478, 0.8516114950180054, 0.9032996892929077, 0.9549877643585205, 1.0066759586334229, 1.0583641529083252, 1.110052227973938, 1.1617404222488403, 1.2134284973144531, 1.2651166915893555, 1.3168047666549683, 1.3684929609298706, 1.4201810359954834]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 7.0, 24.0, 30.0, 32.0, 40.0, 92.0, 151.0, 241.0, 533.0, 1055.0, 2456.0, 6481.0, 22572.0, 115701.0, 600395.0, 242838.0, 39423.0, 10201.0, 3381.0, 1394.0, 684.0, 345.0, 181.0, 103.0, 76.0, 41.0, 26.0, 17.0, 8.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.41552734375, -0.4042015075683594, -0.39287567138671875, -0.3815498352050781, -0.3702239990234375, -0.3588981628417969, -0.34757232666015625, -0.3362464904785156, -0.324920654296875, -0.3135948181152344, -0.30226898193359375, -0.2909431457519531, -0.2796173095703125, -0.2682914733886719, -0.25696563720703125, -0.24563980102539062, -0.23431396484375, -0.22298812866210938, -0.21166229248046875, -0.20033645629882812, -0.1890106201171875, -0.17768478393554688, -0.16635894775390625, -0.15503311157226562, -0.143707275390625, -0.13238143920898438, -0.12105560302734375, -0.10972976684570312, -0.0984039306640625, -0.08707809448242188, -0.07575225830078125, -0.06442642211914062, -0.0531005859375, -0.041774749755859375, -0.03044891357421875, -0.019123077392578125, -0.0077972412109375, 0.003528594970703125, 0.01485443115234375, 0.026180267333984375, 0.037506103515625, 0.048831939697265625, 0.06015777587890625, 0.07148361206054688, 0.0828094482421875, 0.09413528442382812, 0.10546112060546875, 0.11678695678710938, 0.12811279296875, 0.13943862915039062, 0.15076446533203125, 0.16209030151367188, 0.1734161376953125, 0.18474197387695312, 0.19606781005859375, 0.20739364624023438, 0.218719482421875, 0.23004531860351562, 0.24137115478515625, 0.2526969909667969, 0.2640228271484375, 0.2753486633300781, 0.28667449951171875, 0.2980003356933594, 0.309326171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 6.0, 11.0, 12.0, 16.0, 29.0, 36.0, 53.0, 54.0, 77.0, 66.0, 80.0, 64.0, 80.0, 83.0, 73.0, 59.0, 54.0, 31.0, 42.0, 18.0, 8.0, 15.0, 10.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.248046875, -0.240234375, -0.232421875, -0.224609375, -0.216796875, -0.208984375, -0.201171875, -0.193359375, -0.185546875, -0.177734375, -0.169921875, -0.162109375, -0.154296875, -0.146484375, -0.138671875, -0.130859375, -0.123046875, -0.115234375, -0.107421875, -0.099609375, -0.091796875, -0.083984375, -0.076171875, -0.068359375, -0.060546875, -0.052734375, -0.044921875, -0.037109375, -0.029296875, -0.021484375, -0.013671875, -0.005859375, 0.001953125, 0.009765625, 0.017578125, 0.025390625, 0.033203125, 0.041015625, 0.048828125, 0.056640625, 0.064453125, 0.072265625, 0.080078125, 0.087890625, 0.095703125, 0.103515625, 0.111328125, 0.119140625, 0.126953125, 0.134765625, 0.142578125, 0.150390625, 0.158203125, 0.166015625, 0.173828125, 0.181640625, 0.189453125, 0.197265625, 0.205078125, 0.212890625, 0.220703125, 0.228515625, 0.236328125, 0.244140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 14.0, 14.0, 28.0, 39.0, 62.0, 79.0, 117.0, 191.0, 256.0, 452.0, 768.0, 1545.0, 4550.0, 50053.0, 928984.0, 53125.0, 4647.0, 1550.0, 750.0, 474.0, 266.0, 179.0, 123.0, 73.0, 62.0, 40.0, 30.0, 20.0, 10.0, 13.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6842727661132812, -0.6644439697265625, -0.6446151733398438, -0.624786376953125, -0.6049575805664062, -0.5851287841796875, -0.5652999877929688, -0.54547119140625, -0.5256423950195312, -0.5058135986328125, -0.48598480224609375, -0.466156005859375, -0.44632720947265625, -0.4264984130859375, -0.40666961669921875, -0.3868408203125, -0.36701202392578125, -0.3471832275390625, -0.32735443115234375, -0.307525634765625, -0.28769683837890625, -0.2678680419921875, -0.24803924560546875, -0.22821044921875, -0.20838165283203125, -0.1885528564453125, -0.16872406005859375, -0.148895263671875, -0.12906646728515625, -0.1092376708984375, -0.08940887451171875, -0.069580078125, -0.04975128173828125, -0.0299224853515625, -0.01009368896484375, 0.009735107421875, 0.02956390380859375, 0.0493927001953125, 0.06922149658203125, 0.08905029296875, 0.10887908935546875, 0.1287078857421875, 0.14853668212890625, 0.168365478515625, 0.18819427490234375, 0.2080230712890625, 0.22785186767578125, 0.2476806640625, 0.26750946044921875, 0.2873382568359375, 0.30716705322265625, 0.326995849609375, 0.34682464599609375, 0.3666534423828125, 0.38648223876953125, 0.40631103515625, 0.42613983154296875, 0.4459686279296875, 0.46579742431640625, 0.485626220703125, 0.5054550170898438, 0.5252838134765625, 0.5451126098632812, 0.56494140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 14.0, 14.0, 33.0, 32.0, 38.0, 46.0, 52.0, 57.0, 51.0, 71.0, 82.0, 70.0, 77.0, 52.0, 60.0, 35.0, 37.0, 35.0, 23.0, 22.0, 17.0, 13.0, 8.0, 8.0, 10.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5635757446289062, -0.5417022705078125, -0.5198287963867188, -0.497955322265625, -0.47608184814453125, -0.4542083740234375, -0.43233489990234375, -0.41046142578125, -0.38858795166015625, -0.3667144775390625, -0.34484100341796875, -0.322967529296875, -0.30109405517578125, -0.2792205810546875, -0.25734710693359375, -0.2354736328125, -0.21360015869140625, -0.1917266845703125, -0.16985321044921875, -0.147979736328125, -0.12610626220703125, -0.1042327880859375, -0.08235931396484375, -0.06048583984375, -0.03861236572265625, -0.0167388916015625, 0.00513458251953125, 0.027008056640625, 0.04888153076171875, 0.0707550048828125, 0.09262847900390625, 0.114501953125, 0.13637542724609375, 0.1582489013671875, 0.18012237548828125, 0.201995849609375, 0.22386932373046875, 0.2457427978515625, 0.26761627197265625, 0.28948974609375, 0.31136322021484375, 0.3332366943359375, 0.35511016845703125, 0.376983642578125, 0.39885711669921875, 0.4207305908203125, 0.44260406494140625, 0.4644775390625, 0.48635101318359375, 0.5082244873046875, 0.5300979614257812, 0.551971435546875, 0.5738449096679688, 0.5957183837890625, 0.6175918579101562, 0.63946533203125, 0.6613388061523438, 0.6832122802734375, 0.7050857543945312, 0.726959228515625, 0.7488327026367188, 0.7707061767578125, 0.7925796508789062, 0.814453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 5.0, 5.0, 2.0, 4.0, 12.0, 8.0, 6.0, 7.0, 19.0, 22.0, 26.0, 36.0, 66.0, 106.0, 156.0, 277.0, 630.0, 1945.0, 10421.0, 323096.0, 696171.0, 11843.0, 2168.0, 750.0, 301.0, 155.0, 80.0, 60.0, 52.0, 28.0, 19.0, 17.0, 7.0, 10.0, 7.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2138671875, -0.20718955993652344, -0.20051193237304688, -0.1938343048095703, -0.18715667724609375, -0.1804790496826172, -0.17380142211914062, -0.16712379455566406, -0.1604461669921875, -0.15376853942871094, -0.14709091186523438, -0.1404132843017578, -0.13373565673828125, -0.1270580291748047, -0.12038040161132812, -0.11370277404785156, -0.107025146484375, -0.10034751892089844, -0.09366989135742188, -0.08699226379394531, -0.08031463623046875, -0.07363700866699219, -0.06695938110351562, -0.06028175354003906, -0.0536041259765625, -0.04692649841308594, -0.040248870849609375, -0.03357124328613281, -0.02689361572265625, -0.020215988159179688, -0.013538360595703125, -0.0068607330322265625, -0.00018310546875, 0.0064945220947265625, 0.013172149658203125, 0.019849777221679688, 0.02652740478515625, 0.03320503234863281, 0.039882659912109375, 0.04656028747558594, 0.0532379150390625, 0.05991554260253906, 0.06659317016601562, 0.07327079772949219, 0.07994842529296875, 0.08662605285644531, 0.09330368041992188, 0.09998130798339844, 0.106658935546875, 0.11333656311035156, 0.12001419067382812, 0.1266918182373047, 0.13336944580078125, 0.1400470733642578, 0.14672470092773438, 0.15340232849121094, 0.1600799560546875, 0.16675758361816406, 0.17343521118164062, 0.1801128387451172, 0.18679046630859375, 0.1934680938720703, 0.20014572143554688, 0.20682334899902344, 0.2135009765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 13.0, 4.0, 7.0, 10.0, 9.0, 13.0, 19.0, 28.0, 28.0, 41.0, 70.0, 97.0, 121.0, 126.0, 101.0, 84.0, 60.0, 36.0, 22.0, 25.0, 14.0, 10.0, 14.0, 10.0, 7.0, 7.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.70823860168457e-05, -8.492451161146164e-05, -8.276663720607758e-05, -8.060876280069351e-05, -7.845088839530945e-05, -7.629301398992538e-05, -7.413513958454132e-05, -7.197726517915726e-05, -6.98193907737732e-05, -6.766151636838913e-05, -6.550364196300507e-05, -6.3345767557621e-05, -6.118789315223694e-05, -5.9030018746852875e-05, -5.687214434146881e-05, -5.471426993608475e-05, -5.2556395530700684e-05, -5.039852112531662e-05, -4.8240646719932556e-05, -4.608277231454849e-05, -4.392489790916443e-05, -4.1767023503780365e-05, -3.96091490983963e-05, -3.745127469301224e-05, -3.5293400287628174e-05, -3.313552588224411e-05, -3.0977651476860046e-05, -2.8819777071475983e-05, -2.666190266609192e-05, -2.4504028260707855e-05, -2.234615385532379e-05, -2.0188279449939728e-05, -1.8030405044555664e-05, -1.58725306391716e-05, -1.3714656233787537e-05, -1.1556781828403473e-05, -9.39890742301941e-06, -7.2410330176353455e-06, -5.083158612251282e-06, -2.925284206867218e-06, -7.674098014831543e-07, 1.3904646039009094e-06, 3.548339009284973e-06, 5.706213414669037e-06, 7.8640878200531e-06, 1.0021962225437164e-05, 1.2179836630821228e-05, 1.4337711036205292e-05, 1.6495585441589355e-05, 1.865345984697342e-05, 2.0811334252357483e-05, 2.2969208657741547e-05, 2.512708306312561e-05, 2.7284957468509674e-05, 2.9442831873893738e-05, 3.16007062792778e-05, 3.3758580684661865e-05, 3.591645509004593e-05, 3.807432949542999e-05, 4.0232203900814056e-05, 4.239007830619812e-05, 4.4547952711582184e-05, 4.670582711696625e-05, 4.886370152235031e-05, 5.1021575927734375e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 13.0, 26.0, 28.0, 32.0, 53.0, 69.0, 107.0, 212.0, 333.0, 766.0, 1861.0, 6638.0, 44071.0, 859691.0, 118687.0, 11114.0, 2738.0, 1017.0, 472.0, 211.0, 121.0, 75.0, 51.0, 19.0, 22.0, 13.0, 17.0, 15.0, 13.0, 16.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1497802734375, -0.14533233642578125, -0.1408843994140625, -0.13643646240234375, -0.131988525390625, -0.12754058837890625, -0.1230926513671875, -0.11864471435546875, -0.11419677734375, -0.10974884033203125, -0.1053009033203125, -0.10085296630859375, -0.096405029296875, -0.09195709228515625, -0.0875091552734375, -0.08306121826171875, -0.07861328125, -0.07416534423828125, -0.0697174072265625, -0.06526947021484375, -0.060821533203125, -0.05637359619140625, -0.0519256591796875, -0.04747772216796875, -0.04302978515625, -0.03858184814453125, -0.0341339111328125, -0.02968597412109375, -0.025238037109375, -0.02079010009765625, -0.0163421630859375, -0.01189422607421875, -0.0074462890625, -0.00299835205078125, 0.0014495849609375, 0.00589752197265625, 0.010345458984375, 0.01479339599609375, 0.0192413330078125, 0.02368927001953125, 0.02813720703125, 0.03258514404296875, 0.0370330810546875, 0.04148101806640625, 0.045928955078125, 0.05037689208984375, 0.0548248291015625, 0.05927276611328125, 0.063720703125, 0.06816864013671875, 0.0726165771484375, 0.07706451416015625, 0.081512451171875, 0.08596038818359375, 0.0904083251953125, 0.09485626220703125, 0.09930419921875, 0.10375213623046875, 0.1082000732421875, 0.11264801025390625, 0.117095947265625, 0.12154388427734375, 0.1259918212890625, 0.13043975830078125, 0.1348876953125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 17.0, 16.0, 27.0, 46.0, 58.0, 95.0, 131.0, 163.0, 116.0, 91.0, 77.0, 34.0, 32.0, 19.0, 7.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14802932739257812, -0.14395904541015625, -0.13988876342773438, -0.1358184814453125, -0.13174819946289062, -0.12767791748046875, -0.12360763549804688, -0.119537353515625, -0.11546707153320312, -0.11139678955078125, -0.10732650756835938, -0.1032562255859375, -0.09918594360351562, -0.09511566162109375, -0.09104537963867188, -0.08697509765625, -0.08290481567382812, -0.07883453369140625, -0.07476425170898438, -0.0706939697265625, -0.06662368774414062, -0.06255340576171875, -0.058483123779296875, -0.054412841796875, -0.050342559814453125, -0.04627227783203125, -0.042201995849609375, -0.0381317138671875, -0.034061431884765625, -0.02999114990234375, -0.025920867919921875, -0.0218505859375, -0.017780303955078125, -0.01371002197265625, -0.009639739990234375, -0.0055694580078125, -0.001499176025390625, 0.00257110595703125, 0.006641387939453125, 0.010711669921875, 0.014781951904296875, 0.01885223388671875, 0.022922515869140625, 0.0269927978515625, 0.031063079833984375, 0.03513336181640625, 0.039203643798828125, 0.04327392578125, 0.047344207763671875, 0.05141448974609375, 0.055484771728515625, 0.0595550537109375, 0.06362533569335938, 0.06769561767578125, 0.07176589965820312, 0.075836181640625, 0.07990646362304688, 0.08397674560546875, 0.08804702758789062, 0.0921173095703125, 0.09618759155273438, 0.10025787353515625, 0.10432815551757812, 0.1083984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 38.0, 269.0, 605.0, 54.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.463346481323242, -11.2151460647583, -10.96694564819336, -10.718745231628418, -10.470544815063477, -10.222344398498535, -9.974143981933594, -9.725943565368652, -9.477743148803711, -9.22954273223877, -8.981342315673828, -8.733141899108887, -8.484941482543945, -8.236741065979004, -7.9885406494140625, -7.740340232849121, -7.49213981628418, -7.243939399719238, -6.995738983154297, -6.7475385665893555, -6.499338150024414, -6.251137733459473, -6.002937316894531, -5.75473690032959, -5.50653600692749, -5.258335590362549, -5.010135173797607, -4.761934757232666, -4.513734340667725, -4.265533924102783, -4.017333507537842, -3.7691330909729004, -3.520932674407959, -3.2727322578430176, -3.024531841278076, -2.7763314247131348, -2.5281310081481934, -2.279930591583252, -2.0317301750183105, -1.7835296392440796, -1.5353292226791382, -1.2871288061141968, -1.0389283895492554, -0.7907279133796692, -0.5425274968147278, -0.2943270206451416, -0.046126604080200195, 0.2020738124847412, 0.4502742290496826, 0.698474645614624, 0.9466750621795654, 1.1948754787445068, 1.4430758953094482, 1.6912764310836792, 1.9394768476486206, 2.1876773834228516, 2.435877799987793, 2.6840782165527344, 2.932278633117676, 3.180479049682617, 3.4286794662475586, 3.6768798828125, 3.9250802993774414, 4.173280715942383, 4.421481132507324]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 10.0, 13.0, 7.0, 14.0, 13.0, 20.0, 22.0, 26.0, 28.0, 36.0, 51.0, 41.0, 90.0, 183.0, 104.0, 44.0, 45.0, 38.0, 30.0, 32.0, 28.0, 25.0, 15.0, 10.0, 18.0, 7.0, 10.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0799918174743652, -2.0016672611236572, -1.9233425855636597, -1.845017910003662, -1.766693353652954, -1.688368797302246, -1.6100441217422485, -1.531719446182251, -1.453394889831543, -1.375070333480835, -1.2967456579208374, -1.2184209823608398, -1.1400964260101318, -1.0617718696594238, -0.9834471940994263, -0.9051225781440735, -0.8267979621887207, -0.7484733462333679, -0.6701487302780151, -0.5918241143226624, -0.5134994983673096, -0.4351748824119568, -0.356850266456604, -0.2785256505012512, -0.20020103454589844, -0.12187641859054565, -0.04355180263519287, 0.03477281332015991, 0.1130974292755127, 0.19142204523086548, 0.26974666118621826, 0.34807127714157104, 0.4263956546783447, 0.5047202706336975, 0.5830448865890503, 0.6613695025444031, 0.7396941184997559, 0.8180187344551086, 0.8963433504104614, 0.9746679663658142, 1.052992582321167, 1.131317138671875, 1.2096418142318726, 1.2879664897918701, 1.3662910461425781, 1.4446156024932861, 1.5229402780532837, 1.6012649536132812, 1.6795895099639893, 1.7579140663146973, 1.8362387418746948, 1.9145634174346924, 1.9928879737854004, 2.0712125301361084, 2.1495370864868164, 2.2278618812561035, 2.3061864376068115, 2.3845109939575195, 2.4628357887268066, 2.5411603450775146, 2.6194849014282227, 2.6978094577789307, 2.7761340141296387, 2.854458808898926, 2.932783365249634]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 12.0, 11.0, 32.0, 30.0, 49.0, 86.0, 173.0, 290.0, 606.0, 1249.0, 3444.0, 12647.0, 87590.0, 1131623.0, 2569648.0, 346927.0, 29322.0, 6534.0, 2161.0, 895.0, 385.0, 215.0, 128.0, 69.0, 40.0, 30.0, 29.0, 13.0, 7.0, 3.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.269775390625, -0.25988006591796875, -0.2499847412109375, -0.24008941650390625, -0.230194091796875, -0.22029876708984375, -0.2104034423828125, -0.20050811767578125, -0.19061279296875, -0.18071746826171875, -0.1708221435546875, -0.16092681884765625, -0.151031494140625, -0.14113616943359375, -0.1312408447265625, -0.12134552001953125, -0.1114501953125, -0.10155487060546875, -0.0916595458984375, -0.08176422119140625, -0.071868896484375, -0.06197357177734375, -0.0520782470703125, -0.04218292236328125, -0.03228759765625, -0.02239227294921875, -0.0124969482421875, -0.00260162353515625, 0.007293701171875, 0.01718902587890625, 0.0270843505859375, 0.03697967529296875, 0.046875, 0.05677032470703125, 0.0666656494140625, 0.07656097412109375, 0.086456298828125, 0.09635162353515625, 0.1062469482421875, 0.11614227294921875, 0.12603759765625, 0.13593292236328125, 0.1458282470703125, 0.15572357177734375, 0.165618896484375, 0.17551422119140625, 0.1854095458984375, 0.19530487060546875, 0.2052001953125, 0.21509552001953125, 0.2249908447265625, 0.23488616943359375, 0.244781494140625, 0.25467681884765625, 0.2645721435546875, 0.27446746826171875, 0.28436279296875, 0.29425811767578125, 0.3041534423828125, 0.31404876708984375, 0.323944091796875, 0.33383941650390625, 0.3437347412109375, 0.35363006591796875, 0.363525390625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 15.0, 20.0, 31.0, 37.0, 52.0, 59.0, 74.0, 70.0, 70.0, 82.0, 88.0, 84.0, 72.0, 55.0, 38.0, 43.0, 22.0, 18.0, 9.0, 11.0, 12.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24914169311523438, -0.24144744873046875, -0.23375320434570312, -0.2260589599609375, -0.21836471557617188, -0.21067047119140625, -0.20297622680664062, -0.195281982421875, -0.18758773803710938, -0.17989349365234375, -0.17219924926757812, -0.1645050048828125, -0.15681076049804688, -0.14911651611328125, -0.14142227172851562, -0.13372802734375, -0.12603378295898438, -0.11833953857421875, -0.11064529418945312, -0.1029510498046875, -0.09525680541992188, -0.08756256103515625, -0.07986831665039062, -0.072174072265625, -0.06447982788085938, -0.05678558349609375, -0.049091339111328125, -0.0413970947265625, -0.033702850341796875, -0.02600860595703125, -0.018314361572265625, -0.0106201171875, -0.002925872802734375, 0.00476837158203125, 0.012462615966796875, 0.0201568603515625, 0.027851104736328125, 0.03554534912109375, 0.043239593505859375, 0.050933837890625, 0.058628082275390625, 0.06632232666015625, 0.07401657104492188, 0.0817108154296875, 0.08940505981445312, 0.09709930419921875, 0.10479354858398438, 0.11248779296875, 0.12018203735351562, 0.12787628173828125, 0.13557052612304688, 0.1432647705078125, 0.15095901489257812, 0.15865325927734375, 0.16634750366210938, 0.174041748046875, 0.18173599243164062, 0.18943023681640625, 0.19712448120117188, 0.2048187255859375, 0.21251296997070312, 0.22020721435546875, 0.22790145874023438, 0.235595703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 4.0, 5.0, 10.0, 7.0, 13.0, 29.0, 40.0, 53.0, 85.0, 150.0, 337.0, 796.0, 2110.0, 12138.0, 3662971.0, 503794.0, 8334.0, 1941.0, 703.0, 342.0, 162.0, 97.0, 52.0, 39.0, 22.0, 15.0, 13.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.0367279052734375, -1.003143310546875, -0.9695587158203125, -0.93597412109375, -0.9023895263671875, -0.868804931640625, -0.8352203369140625, -0.8016357421875, -0.7680511474609375, -0.734466552734375, -0.7008819580078125, -0.66729736328125, -0.6337127685546875, -0.600128173828125, -0.5665435791015625, -0.532958984375, -0.4993743896484375, -0.465789794921875, -0.4322052001953125, -0.39862060546875, -0.3650360107421875, -0.331451416015625, -0.2978668212890625, -0.2642822265625, -0.2306976318359375, -0.197113037109375, -0.1635284423828125, -0.12994384765625, -0.0963592529296875, -0.062774658203125, -0.0291900634765625, 0.00439453125, 0.0379791259765625, 0.071563720703125, 0.1051483154296875, 0.13873291015625, 0.1723175048828125, 0.205902099609375, 0.2394866943359375, 0.2730712890625, 0.3066558837890625, 0.340240478515625, 0.3738250732421875, 0.40740966796875, 0.4409942626953125, 0.474578857421875, 0.5081634521484375, 0.541748046875, 0.5753326416015625, 0.608917236328125, 0.6425018310546875, 0.67608642578125, 0.7096710205078125, 0.743255615234375, 0.7768402099609375, 0.8104248046875, 0.8440093994140625, 0.877593994140625, 0.9111785888671875, 0.94476318359375, 0.9783477783203125, 1.011932373046875, 1.0455169677734375, 1.0791015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 5.0, 12.0, 31.0, 68.0, 107.0, 193.0, 379.0, 755.0, 919.0, 674.0, 400.0, 198.0, 118.0, 70.0, 39.0, 30.0, 20.0, 18.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5830078125, -0.55908203125, -0.53515625, -0.51123046875, -0.4873046875, -0.46337890625, -0.439453125, -0.41552734375, -0.3916015625, -0.36767578125, -0.34375, -0.31982421875, -0.2958984375, -0.27197265625, -0.248046875, -0.22412109375, -0.2001953125, -0.17626953125, -0.15234375, -0.12841796875, -0.1044921875, -0.08056640625, -0.056640625, -0.03271484375, -0.0087890625, 0.01513671875, 0.0390625, 0.06298828125, 0.0869140625, 0.11083984375, 0.134765625, 0.15869140625, 0.1826171875, 0.20654296875, 0.23046875, 0.25439453125, 0.2783203125, 0.30224609375, 0.326171875, 0.35009765625, 0.3740234375, 0.39794921875, 0.421875, 0.44580078125, 0.4697265625, 0.49365234375, 0.517578125, 0.54150390625, 0.5654296875, 0.58935546875, 0.61328125, 0.63720703125, 0.6611328125, 0.68505859375, 0.708984375, 0.73291015625, 0.7568359375, 0.78076171875, 0.8046875, 0.82861328125, 0.8525390625, 0.87646484375, 0.900390625, 0.92431640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 19.0, 41.0, 184.0, 400.0, 207.0, 71.0, 27.0, 14.0, 9.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7272138595581055, -3.363909959793091, -3.000606060028076, -2.6373021602630615, -2.273998260498047, -1.9106943607330322, -1.5473904609680176, -1.184086561203003, -0.8207826614379883, -0.45747876167297363, -0.09417486190795898, 0.26912903785705566, 0.6324329376220703, 0.995736837387085, 1.3590407371520996, 1.7223446369171143, 2.085648536682129, 2.4489524364471436, 2.812256336212158, 3.175560235977173, 3.5388641357421875, 3.902168035507202, 4.265471935272217, 4.628775596618652, 4.992079734802246, 5.35538387298584, 5.718687534332275, 6.081991195678711, 6.445295333862305, 6.808599472045898, 7.171903133392334, 7.5352067947387695, 7.898509979248047, 8.26181411743164, 8.625118255615234, 8.988421440124512, 9.351725578308105, 9.7150297164917, 10.078332901000977, 10.44163703918457, 10.804941177368164, 11.168245315551758, 11.531549453735352, 11.894852638244629, 12.258156776428223, 12.621460914611816, 12.984764099121094, 13.348068237304688, 13.711372375488281, 14.074676513671875, 14.437980651855469, 14.801283836364746, 15.16458797454834, 15.527892112731934, 15.891195297241211, 16.254499435424805, 16.6178035736084, 16.981107711791992, 17.344411849975586, 17.70771598815918, 18.07101821899414, 18.434322357177734, 18.797626495361328, 19.160930633544922, 19.524234771728516]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 1.0, 2.0, 7.0, 6.0, 12.0, 10.0, 14.0, 24.0, 42.0, 40.0, 41.0, 62.0, 53.0, 85.0, 85.0, 89.0, 100.0, 71.0, 49.0, 48.0, 39.0, 32.0, 18.0, 12.0, 16.0, 15.0, 8.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.228280067443848, -4.069037437438965, -3.909795045852661, -3.7505526542663574, -3.5913100242614746, -3.432067394256592, -3.272825002670288, -3.1135826110839844, -2.9543399810791016, -2.7950973510742188, -2.635854959487915, -2.4766125679016113, -2.3173699378967285, -2.1581273078918457, -1.998884916305542, -1.8396424055099487, -1.6803998947143555, -1.5211573839187622, -1.361914873123169, -1.2026723623275757, -1.0434298515319824, -0.8841873407363892, -0.7249448299407959, -0.5657023191452026, -0.4064598083496094, -0.2472172975540161, -0.08797478675842285, 0.07126772403717041, 0.23051023483276367, 0.38975274562835693, 0.5489952564239502, 0.7082377672195435, 0.8674802780151367, 1.02672278881073, 1.1859652996063232, 1.3452078104019165, 1.5044503211975098, 1.663692831993103, 1.8229353427886963, 1.9821778535842896, 2.141420364379883, 2.3006629943847656, 2.4599053859710693, 2.619147777557373, 2.778390407562256, 2.9376330375671387, 3.0968754291534424, 3.256117820739746, 3.415360450744629, 3.5746030807495117, 3.7338454723358154, 3.893087863922119, 4.052330493927002, 4.211573123931885, 4.370815277099609, 4.530057907104492, 4.689300537109375, 4.848543167114258, 5.007785797119141, 5.167027950286865, 5.326270580291748, 5.485513210296631, 5.6447553634643555, 5.803997993469238, 5.963240623474121]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 7.0, 16.0, 24.0, 52.0, 71.0, 91.0, 181.0, 292.0, 603.0, 1397.0, 3445.0, 9769.0, 38503.0, 286642.0, 623168.0, 62477.0, 13858.0, 4615.0, 1715.0, 731.0, 375.0, 176.0, 109.0, 87.0, 40.0, 25.0, 22.0, 12.0, 9.0, 4.0, 12.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3310546875, -0.3207550048828125, -0.310455322265625, -0.3001556396484375, -0.28985595703125, -0.2795562744140625, -0.269256591796875, -0.2589569091796875, -0.2486572265625, -0.2383575439453125, -0.228057861328125, -0.2177581787109375, -0.20745849609375, -0.1971588134765625, -0.186859130859375, -0.1765594482421875, -0.166259765625, -0.1559600830078125, -0.145660400390625, -0.1353607177734375, -0.12506103515625, -0.1147613525390625, -0.104461669921875, -0.0941619873046875, -0.0838623046875, -0.0735626220703125, -0.063262939453125, -0.0529632568359375, -0.04266357421875, -0.0323638916015625, -0.022064208984375, -0.0117645263671875, -0.00146484375, 0.0088348388671875, 0.019134521484375, 0.0294342041015625, 0.03973388671875, 0.0500335693359375, 0.060333251953125, 0.0706329345703125, 0.0809326171875, 0.0912322998046875, 0.101531982421875, 0.1118316650390625, 0.12213134765625, 0.1324310302734375, 0.142730712890625, 0.1530303955078125, 0.163330078125, 0.1736297607421875, 0.183929443359375, 0.1942291259765625, 0.20452880859375, 0.2148284912109375, 0.225128173828125, 0.2354278564453125, 0.2457275390625, 0.2560272216796875, 0.266326904296875, 0.2766265869140625, 0.28692626953125, 0.2972259521484375, 0.307525634765625, 0.3178253173828125, 0.328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 13.0, 24.0, 32.0, 35.0, 57.0, 63.0, 82.0, 76.0, 92.0, 87.0, 83.0, 68.0, 71.0, 45.0, 52.0, 43.0, 20.0, 12.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.24055862426757812, -0.22965240478515625, -0.21874618530273438, -0.2078399658203125, -0.19693374633789062, -0.18602752685546875, -0.17512130737304688, -0.164215087890625, -0.15330886840820312, -0.14240264892578125, -0.13149642944335938, -0.1205902099609375, -0.10968399047851562, -0.09877777099609375, -0.08787155151367188, -0.07696533203125, -0.06605911254882812, -0.05515289306640625, -0.044246673583984375, -0.0333404541015625, -0.022434234619140625, -0.01152801513671875, -0.000621795654296875, 0.010284423828125, 0.021190643310546875, 0.03209686279296875, 0.043003082275390625, 0.0539093017578125, 0.06481552124023438, 0.07572174072265625, 0.08662796020507812, 0.0975341796875, 0.10844039916992188, 0.11934661865234375, 0.13025283813476562, 0.1411590576171875, 0.15206527709960938, 0.16297149658203125, 0.17387771606445312, 0.184783935546875, 0.19569015502929688, 0.20659637451171875, 0.21750259399414062, 0.2284088134765625, 0.23931503295898438, 0.25022125244140625, 0.2611274719238281, 0.27203369140625, 0.2829399108886719, 0.29384613037109375, 0.3047523498535156, 0.3156585693359375, 0.3265647888183594, 0.33747100830078125, 0.3483772277832031, 0.359283447265625, 0.3701896667480469, 0.38109588623046875, 0.3920021057128906, 0.4029083251953125, 0.4138145446777344, 0.42472076416015625, 0.4356269836425781, 0.446533203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 5.0, 9.0, 21.0, 30.0, 40.0, 59.0, 66.0, 112.0, 158.0, 324.0, 586.0, 1390.0, 5097.0, 48773.0, 943722.0, 40878.0, 4572.0, 1323.0, 521.0, 326.0, 174.0, 117.0, 67.0, 54.0, 45.0, 19.0, 10.0, 10.0, 9.0, 7.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.428955078125, -0.4153251647949219, -0.40169525146484375, -0.3880653381347656, -0.3744354248046875, -0.3608055114746094, -0.34717559814453125, -0.3335456848144531, -0.319915771484375, -0.3062858581542969, -0.29265594482421875, -0.2790260314941406, -0.2653961181640625, -0.2517662048339844, -0.23813629150390625, -0.22450637817382812, -0.21087646484375, -0.19724655151367188, -0.18361663818359375, -0.16998672485351562, -0.1563568115234375, -0.14272689819335938, -0.12909698486328125, -0.11546707153320312, -0.101837158203125, -0.08820724487304688, -0.07457733154296875, -0.060947418212890625, -0.0473175048828125, -0.033687591552734375, -0.02005767822265625, -0.006427764892578125, 0.0072021484375, 0.020832061767578125, 0.03446197509765625, 0.048091888427734375, 0.0617218017578125, 0.07535171508789062, 0.08898162841796875, 0.10261154174804688, 0.116241455078125, 0.12987136840820312, 0.14350128173828125, 0.15713119506835938, 0.1707611083984375, 0.18439102172851562, 0.19802093505859375, 0.21165084838867188, 0.22528076171875, 0.23891067504882812, 0.25254058837890625, 0.2661705017089844, 0.2798004150390625, 0.2934303283691406, 0.30706024169921875, 0.3206901550292969, 0.334320068359375, 0.3479499816894531, 0.36157989501953125, 0.3752098083496094, 0.3888397216796875, 0.4024696350097656, 0.41609954833984375, 0.4297294616699219, 0.443359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 6.0, 7.0, 4.0, 8.0, 5.0, 10.0, 10.0, 2.0, 18.0, 16.0, 24.0, 30.0, 39.0, 42.0, 56.0, 52.0, 76.0, 67.0, 83.0, 57.0, 65.0, 47.0, 42.0, 39.0, 27.0, 22.0, 16.0, 16.0, 19.0, 17.0, 9.0, 13.0, 9.0, 6.0, 3.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.72265625, -0.7010116577148438, -0.6793670654296875, -0.6577224731445312, -0.636077880859375, -0.6144332885742188, -0.5927886962890625, -0.5711441040039062, -0.54949951171875, -0.5278549194335938, -0.5062103271484375, -0.48456573486328125, -0.462921142578125, -0.44127655029296875, -0.4196319580078125, -0.39798736572265625, -0.3763427734375, -0.35469818115234375, -0.3330535888671875, -0.31140899658203125, -0.289764404296875, -0.26811981201171875, -0.2464752197265625, -0.22483062744140625, -0.20318603515625, -0.18154144287109375, -0.1598968505859375, -0.13825225830078125, -0.116607666015625, -0.09496307373046875, -0.0733184814453125, -0.05167388916015625, -0.030029296875, -0.00838470458984375, 0.0132598876953125, 0.03490447998046875, 0.056549072265625, 0.07819366455078125, 0.0998382568359375, 0.12148284912109375, 0.14312744140625, 0.16477203369140625, 0.1864166259765625, 0.20806121826171875, 0.229705810546875, 0.25135040283203125, 0.2729949951171875, 0.29463958740234375, 0.3162841796875, 0.33792877197265625, 0.3595733642578125, 0.38121795654296875, 0.402862548828125, 0.42450714111328125, 0.4461517333984375, 0.46779632568359375, 0.48944091796875, 0.5110855102539062, 0.5327301025390625, 0.5543746948242188, 0.576019287109375, 0.5976638793945312, 0.6193084716796875, 0.6409530639648438, 0.66259765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 11.0, 10.0, 15.0, 28.0, 18.0, 30.0, 51.0, 79.0, 104.0, 168.0, 248.0, 429.0, 872.0, 1800.0, 4956.0, 19461.0, 212000.0, 773846.0, 24317.0, 5807.0, 2042.0, 966.0, 479.0, 240.0, 159.0, 120.0, 78.0, 46.0, 52.0, 29.0, 23.0, 13.0, 10.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05438232421875, -0.05257368087768555, -0.050765037536621094, -0.04895639419555664, -0.04714775085449219, -0.045339107513427734, -0.04353046417236328, -0.04172182083129883, -0.039913177490234375, -0.03810453414916992, -0.03629589080810547, -0.034487247467041016, -0.03267860412597656, -0.03086996078491211, -0.029061317443847656, -0.027252674102783203, -0.02544403076171875, -0.023635387420654297, -0.021826744079589844, -0.02001810073852539, -0.018209457397460938, -0.016400814056396484, -0.014592170715332031, -0.012783527374267578, -0.010974884033203125, -0.009166240692138672, -0.007357597351074219, -0.005548954010009766, -0.0037403106689453125, -0.0019316673278808594, -0.00012302398681640625, 0.0016856193542480469, 0.0034942626953125, 0.005302906036376953, 0.007111549377441406, 0.00892019271850586, 0.010728836059570312, 0.012537479400634766, 0.014346122741699219, 0.016154766082763672, 0.017963409423828125, 0.019772052764892578, 0.02158069610595703, 0.023389339447021484, 0.025197982788085938, 0.02700662612915039, 0.028815269470214844, 0.030623912811279297, 0.03243255615234375, 0.0342411994934082, 0.036049842834472656, 0.03785848617553711, 0.03966712951660156, 0.041475772857666016, 0.04328441619873047, 0.04509305953979492, 0.046901702880859375, 0.04871034622192383, 0.05051898956298828, 0.052327632904052734, 0.05413627624511719, 0.05594491958618164, 0.057753562927246094, 0.05956220626831055, 0.061370849609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 7.0, 3.0, 10.0, 16.0, 24.0, 26.0, 51.0, 49.0, 57.0, 80.0, 84.0, 93.0, 92.0, 86.0, 67.0, 56.0, 33.0, 35.0, 28.0, 13.0, 16.0, 16.0, 6.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4809112548828125e-05, -3.34596261382103e-05, -3.211013972759247e-05, -3.076065331697464e-05, -2.941116690635681e-05, -2.8061680495738983e-05, -2.6712194085121155e-05, -2.5362707674503326e-05, -2.4013221263885498e-05, -2.266373485326767e-05, -2.131424844264984e-05, -1.9964762032032013e-05, -1.8615275621414185e-05, -1.7265789210796356e-05, -1.5916302800178528e-05, -1.45668163895607e-05, -1.3217329978942871e-05, -1.1867843568325043e-05, -1.0518357157707214e-05, -9.168870747089386e-06, -7.819384336471558e-06, -6.469897925853729e-06, -5.120411515235901e-06, -3.7709251046180725e-06, -2.421438694000244e-06, -1.0719522833824158e-06, 2.775341272354126e-07, 1.627020537853241e-06, 2.9765069484710693e-06, 4.325993359088898e-06, 5.675479769706726e-06, 7.0249661803245544e-06, 8.374452590942383e-06, 9.723939001560211e-06, 1.107342541217804e-05, 1.2422911822795868e-05, 1.3772398233413696e-05, 1.5121884644031525e-05, 1.6471371054649353e-05, 1.782085746526718e-05, 1.917034387588501e-05, 2.0519830286502838e-05, 2.1869316697120667e-05, 2.3218803107738495e-05, 2.4568289518356323e-05, 2.591777592897415e-05, 2.726726233959198e-05, 2.861674875020981e-05, 2.9966235160827637e-05, 3.1315721571445465e-05, 3.2665207982063293e-05, 3.401469439268112e-05, 3.536418080329895e-05, 3.671366721391678e-05, 3.806315362453461e-05, 3.9412640035152435e-05, 4.0762126445770264e-05, 4.211161285638809e-05, 4.346109926700592e-05, 4.481058567762375e-05, 4.616007208824158e-05, 4.7509558498859406e-05, 4.8859044909477234e-05, 5.020853132009506e-05, 5.155801773071289e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 7.0, 5.0, 7.0, 12.0, 13.0, 19.0, 24.0, 29.0, 39.0, 58.0, 79.0, 141.0, 153.0, 274.0, 447.0, 740.0, 1268.0, 2408.0, 4994.0, 10902.0, 28721.0, 120816.0, 773195.0, 67366.0, 20038.0, 8184.0, 3890.0, 1934.0, 1082.0, 601.0, 353.0, 240.0, 163.0, 96.0, 73.0, 48.0, 33.0, 28.0, 13.0, 16.0, 11.0, 18.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0308990478515625, -0.029880285263061523, -0.028861522674560547, -0.02784276008605957, -0.026823997497558594, -0.025805234909057617, -0.02478647232055664, -0.023767709732055664, -0.022748947143554688, -0.02173018455505371, -0.020711421966552734, -0.019692659378051758, -0.01867389678955078, -0.017655134201049805, -0.016636371612548828, -0.015617609024047852, -0.014598846435546875, -0.013580083847045898, -0.012561321258544922, -0.011542558670043945, -0.010523796081542969, -0.009505033493041992, -0.008486270904541016, -0.007467508316040039, -0.0064487457275390625, -0.005429983139038086, -0.004411220550537109, -0.003392457962036133, -0.0023736953735351562, -0.0013549327850341797, -0.0003361701965332031, 0.0006825923919677734, 0.00170135498046875, 0.0027201175689697266, 0.003738880157470703, 0.00475764274597168, 0.005776405334472656, 0.006795167922973633, 0.00781393051147461, 0.008832693099975586, 0.009851455688476562, 0.010870218276977539, 0.011888980865478516, 0.012907743453979492, 0.013926506042480469, 0.014945268630981445, 0.015964031219482422, 0.0169827938079834, 0.018001556396484375, 0.01902031898498535, 0.020039081573486328, 0.021057844161987305, 0.02207660675048828, 0.023095369338989258, 0.024114131927490234, 0.02513289451599121, 0.026151657104492188, 0.027170419692993164, 0.02818918228149414, 0.029207944869995117, 0.030226707458496094, 0.03124547004699707, 0.03226423263549805, 0.03328299522399902, 0.0343017578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 3.0, 3.0, 5.0, 10.0, 10.0, 9.0, 14.0, 12.0, 28.0, 32.0, 43.0, 79.0, 133.0, 171.0, 136.0, 96.0, 60.0, 46.0, 27.0, 11.0, 14.0, 13.0, 7.0, 8.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06182575225830078, -0.05980873107910156, -0.057791709899902344, -0.055774688720703125, -0.053757667541503906, -0.05174064636230469, -0.04972362518310547, -0.04770660400390625, -0.04568958282470703, -0.04367256164550781, -0.041655540466308594, -0.039638519287109375, -0.037621498107910156, -0.03560447692871094, -0.03358745574951172, -0.0315704345703125, -0.02955341339111328, -0.027536392211914062, -0.025519371032714844, -0.023502349853515625, -0.021485328674316406, -0.019468307495117188, -0.01745128631591797, -0.01543426513671875, -0.013417243957519531, -0.011400222778320312, -0.009383201599121094, -0.007366180419921875, -0.005349159240722656, -0.0033321380615234375, -0.0013151168823242188, 0.000701904296875, 0.0027189254760742188, 0.0047359466552734375, 0.006752967834472656, 0.008769989013671875, 0.010787010192871094, 0.012804031372070312, 0.014821052551269531, 0.01683807373046875, 0.01885509490966797, 0.020872116088867188, 0.022889137268066406, 0.024906158447265625, 0.026923179626464844, 0.028940200805664062, 0.03095722198486328, 0.0329742431640625, 0.03499126434326172, 0.03700828552246094, 0.039025306701660156, 0.041042327880859375, 0.043059349060058594, 0.04507637023925781, 0.04709339141845703, 0.04911041259765625, 0.05112743377685547, 0.05314445495605469, 0.055161476135253906, 0.057178497314453125, 0.059195518493652344, 0.06121253967285156, 0.06322956085205078, 0.06524658203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 13.0, 28.0, 39.0, 62.0, 156.0, 540.0, 77.0, 38.0, 16.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0018630027771, -4.896159648895264, -4.790456295013428, -4.684752464294434, -4.579049110412598, -4.473345756530762, -4.367642402648926, -4.26193904876709, -4.156235694885254, -4.050532341003418, -3.944828748703003, -3.839125394821167, -3.733421802520752, -3.627718448638916, -3.52201509475708, -3.416311740875244, -3.31060791015625, -3.204904556274414, -3.099200963973999, -2.993497610092163, -2.887794017791748, -2.782090663909912, -2.676387310028076, -2.5706839561462402, -2.464980363845825, -2.3592770099639893, -2.253573417663574, -2.1478700637817383, -2.0421667098999023, -1.9364631175994873, -1.8307597637176514, -1.7250562906265259, -1.6193530559539795, -1.513649582862854, -1.4079461097717285, -1.3022427558898926, -1.196539282798767, -1.0908358097076416, -0.9851323962211609, -0.8794289827346802, -0.7737255096435547, -0.6680220365524292, -0.5623186230659485, -0.4566151797771454, -0.3509117364883423, -0.2452082633972168, -0.13950484991073608, -0.03380143642425537, 0.07190203666687012, 0.17760547995567322, 0.2833089232444763, 0.3890123665332794, 0.4947158098220825, 0.600419282913208, 0.7061226963996887, 0.8118261098861694, 0.9175295829772949, 1.0232330560684204, 1.128936529159546, 1.2346398830413818, 1.3403433561325073, 1.4460468292236328, 1.5517501831054688, 1.6574536561965942, 1.7631571292877197]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 10.0, 7.0, 13.0, 11.0, 20.0, 14.0, 16.0, 19.0, 23.0, 33.0, 26.0, 37.0, 89.0, 324.0, 104.0, 26.0, 18.0, 21.0, 26.0, 23.0, 26.0, 23.0, 23.0, 8.0, 11.0, 6.0, 6.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5587775707244873, -2.4887776374816895, -2.4187777042388916, -2.3487777709960938, -2.278778076171875, -2.208778142929077, -2.1387782096862793, -2.0687782764434814, -1.9987783432006836, -1.9287784099578857, -1.858778476715088, -1.7887786626815796, -1.7187787294387817, -1.6487787961959839, -1.5787789821624756, -1.5087790489196777, -1.4387791156768799, -1.368779182434082, -1.2987792491912842, -1.2287794351577759, -1.158779501914978, -1.0887795686721802, -1.0187797546386719, -0.948779821395874, -0.8787798881530762, -0.8087799549102783, -0.7387800812721252, -0.6687802076339722, -0.5987802743911743, -0.5287803411483765, -0.4587804675102234, -0.3887805640697479, -0.31878089904785156, -0.2487809956073761, -0.17878109216690063, -0.10878118872642517, -0.03878128528594971, 0.031218618154525757, 0.10121852159500122, 0.17121842503547668, 0.24121832847595215, 0.3112182319164276, 0.3812181353569031, 0.45121803879737854, 0.521217942237854, 0.5912178754806519, 0.6612177491188049, 0.731217622756958, 0.8012175559997559, 0.8712174892425537, 0.9412173628807068, 1.0112172365188599, 1.0812171697616577, 1.1512171030044556, 1.2212169170379639, 1.2912168502807617, 1.3612167835235596, 1.4312167167663574, 1.5012166500091553, 1.5712164640426636, 1.6412163972854614, 1.7112163305282593, 1.7812161445617676, 1.8512160778045654, 1.9212160110473633]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 16.0, 22.0, 34.0, 37.0, 48.0, 70.0, 211.0, 260.0, 69.0, 59.0, 41.0, 33.0, 24.0, 23.0, 10.0, 9.0, 5.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2168598175048828, -0.20654678344726562, -0.19623374938964844, -0.18592071533203125, -0.17560768127441406, -0.16529464721679688, -0.1549816131591797, -0.1446685791015625, -0.1343555450439453, -0.12404251098632812, -0.11372947692871094, -0.10341644287109375, -0.09310340881347656, -0.08279037475585938, -0.07247734069824219, -0.062164306640625, -0.05185127258300781, -0.041538238525390625, -0.031225204467773438, -0.02091217041015625, -0.010599136352539062, -0.000286102294921875, 0.010026931762695312, 0.0203399658203125, 0.030652999877929688, 0.040966033935546875, 0.05127906799316406, 0.06159210205078125, 0.07190513610839844, 0.08221817016601562, 0.09253120422363281, 0.10284423828125, 0.11315727233886719, 0.12347030639648438, 0.13378334045410156, 0.14409637451171875, 0.15440940856933594, 0.16472244262695312, 0.1750354766845703, 0.1853485107421875, 0.1956615447998047, 0.20597457885742188, 0.21628761291503906, 0.22660064697265625, 0.23691368103027344, 0.24722671508789062, 0.2575397491455078, 0.267852783203125, 0.2781658172607422, 0.2884788513183594, 0.29879188537597656, 0.30910491943359375, 0.31941795349121094, 0.3297309875488281, 0.3400440216064453, 0.3503570556640625, 0.3606700897216797, 0.3709831237792969, 0.38129615783691406, 0.39160919189453125, 0.40192222595214844, 0.4122352600097656, 0.4225482940673828, 0.432861328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 11.0, 10.0, 5.0, 16.0, 14.0, 20.0, 33.0, 24.0, 62.0, 171.0, 443.0, 2900.0, 8365785.0, 17554.0, 986.0, 260.0, 105.0, 52.0, 9.0, 10.0, 40.0, 14.0, 5.0, 18.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 5.0], "bins": [-3.53940749168396, -3.42431902885437, -3.3092308044433594, -3.1941423416137695, -3.079054117202759, -2.963965654373169, -2.848877429962158, -2.7337889671325684, -2.6187005043029785, -2.5036120414733887, -2.388523817062378, -2.273435354232788, -2.1583471298217773, -2.0432586669921875, -1.9281703233718872, -1.813081979751587, -1.6979937553405762, -1.5829054117202759, -1.4678170680999756, -1.3527286052703857, -1.237640380859375, -1.1225519180297852, -1.0074635744094849, -0.8923752307891846, -0.7772868871688843, -0.662198543548584, -0.5471101999282837, -0.4320217967033386, -0.31693345308303833, -0.20184510946273804, -0.08675670623779297, 0.028331637382507324, 0.14341998100280762, 0.2585083246231079, 0.3735966980457306, 0.48868507146835327, 0.6037734150886536, 0.7188617587089539, 0.8339501619338989, 0.9490385055541992, 1.0641268491744995, 1.1792151927947998, 1.2943035364151, 1.4093918800354004, 1.5244803428649902, 1.639568567276001, 1.7546570301055908, 1.8697453737258911, 1.9848337173461914, 2.0999221801757812, 2.215010404586792, 2.330098867416382, 2.4451870918273926, 2.5602755546569824, 2.6753640174865723, 2.790452241897583, 2.9055404663085938, 3.0206289291381836, 3.1357171535491943, 3.250805616378784, 3.365893840789795, 3.4809823036193848, 3.5960707664489746, 3.7111589908599854, 3.826247453689575]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 1.0, 11.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.611243963241577, -2.531331777572632, -2.4514195919036865, -2.3715076446533203, -2.291595458984375, -2.2116832733154297, -2.1317710876464844, -2.051858901977539, -1.9719469547271729, -1.8920347690582275, -1.8121227025985718, -1.7322105169296265, -1.6522984504699707, -1.5723862648010254, -1.49247407913208, -1.4125620126724243, -1.332649827003479, -1.2527376413345337, -1.172825574874878, -1.0929133892059326, -1.0130013227462769, -0.9330891370773315, -0.853177011013031, -0.7732648849487305, -0.6933527588844299, -0.6134406328201294, -0.5335285067558289, -0.45361635088920593, -0.3737042248249054, -0.29379209876060486, -0.21387994289398193, -0.1339678168296814, -0.05405569076538086, 0.025856442749500275, 0.10576857626438141, 0.18568071722984314, 0.2655928432941437, 0.3455049693584442, 0.42541712522506714, 0.5053292512893677, 0.5852413773536682, 0.6651535034179688, 0.7450656294822693, 0.8249777555465698, 0.9048899412155151, 0.9848020076751709, 1.0647141933441162, 1.1446263790130615, 1.2245384454727173, 1.3044506311416626, 1.3843626976013184, 1.4642748832702637, 1.5441869497299194, 1.6240991353988647, 1.7040112018585205, 1.7839233875274658, 1.8638355731964111, 1.9437477588653564, 2.0236599445343018, 2.103571891784668, 2.1834840774536133, 2.2633962631225586, 2.343308448791504, 2.423220634460449, 2.5031325817108154]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 17.0, 6.0, 28.0, 35.0, 44.0, 61.0, 96.0, 147.0, 211.0, 439.0, 1019.0, 3458.0, 15066.0, 86356.0, 302223.0, 93687.0, 15754.0, 3320.0, 1056.0, 464.0, 243.0, 163.0, 111.0, 71.0, 56.0, 33.0, 14.0, 20.0, 14.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.245391845703125, -2.18218994140625, -2.118988037109375, -2.0557861328125, -1.992584228515625, -1.92938232421875, -1.866180419921875, -1.802978515625, -1.739776611328125, -1.67657470703125, -1.613372802734375, -1.5501708984375, -1.486968994140625, -1.42376708984375, -1.360565185546875, -1.29736328125, -1.234161376953125, -1.17095947265625, -1.107757568359375, -1.0445556640625, -0.981353759765625, -0.91815185546875, -0.854949951171875, -0.791748046875, -0.728546142578125, -0.66534423828125, -0.602142333984375, -0.5389404296875, -0.475738525390625, -0.41253662109375, -0.349334716796875, -0.2861328125, -0.222930908203125, -0.15972900390625, -0.096527099609375, -0.0333251953125, 0.029876708984375, 0.09307861328125, 0.156280517578125, 0.219482421875, 0.282684326171875, 0.34588623046875, 0.409088134765625, 0.4722900390625, 0.535491943359375, 0.59869384765625, 0.661895751953125, 0.72509765625, 0.788299560546875, 0.85150146484375, 0.914703369140625, 0.9779052734375, 1.041107177734375, 1.10430908203125, 1.167510986328125, 1.230712890625, 1.293914794921875, 1.35711669921875, 1.420318603515625, 1.4835205078125, 1.546722412109375, 1.60992431640625, 1.673126220703125, 1.736328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 6.0, 8.0, 12.0, 18.0, 20.0, 38.0, 34.0, 41.0, 60.0, 62.0, 104.0, 112.0, 98.0, 99.0, 73.0, 51.0, 37.0, 19.0, 24.0, 23.0, 16.0, 10.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.298492431640625, -0.28741455078125, -0.276336669921875, -0.2652587890625, -0.254180908203125, -0.24310302734375, -0.232025146484375, -0.220947265625, -0.209869384765625, -0.19879150390625, -0.187713623046875, -0.1766357421875, -0.165557861328125, -0.15447998046875, -0.143402099609375, -0.13232421875, -0.121246337890625, -0.11016845703125, -0.099090576171875, -0.0880126953125, -0.076934814453125, -0.06585693359375, -0.054779052734375, -0.043701171875, -0.032623291015625, -0.02154541015625, -0.010467529296875, 0.0006103515625, 0.011688232421875, 0.02276611328125, 0.033843994140625, 0.044921875, 0.055999755859375, 0.06707763671875, 0.078155517578125, 0.0892333984375, 0.100311279296875, 0.11138916015625, 0.122467041015625, 0.133544921875, 0.144622802734375, 0.15570068359375, 0.166778564453125, 0.1778564453125, 0.188934326171875, 0.20001220703125, 0.211090087890625, 0.22216796875, 0.233245849609375, 0.24432373046875, 0.255401611328125, 0.2664794921875, 0.277557373046875, 0.28863525390625, 0.299713134765625, 0.310791015625, 0.321868896484375, 0.33294677734375, 0.344024658203125, 0.3551025390625, 0.366180419921875, 0.37725830078125, 0.388336181640625, 0.3994140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 23.0, 37.0, 87.0, 102.0, 107.0, 54.0, 17.0, 18.0, 4.0, 7.0, 2.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6309139728546143, -1.5468950271606445, -1.4628762006759644, -1.3788572549819946, -1.294838309288025, -1.2108194828033447, -1.126800537109375, -1.0427815914154053, -0.9587627053260803, -0.8747438192367554, -0.7907248735427856, -0.7067059874534607, -0.6226871013641357, -0.538668155670166, -0.45464926958084106, -0.37063032388687134, -0.2866114377975464, -0.20259252190589905, -0.1185736209154129, -0.03455471992492676, 0.04946419596672058, 0.13348311185836792, 0.21750199794769287, 0.3015209436416626, 0.38553982973098755, 0.4695587456226349, 0.5535776615142822, 0.6375965476036072, 0.7216154336929321, 0.8056343793869019, 0.8896532654762268, 0.9736722111701965, 1.0576910972595215, 1.1417100429534912, 1.2257288694381714, 1.3097478151321411, 1.3937667608261108, 1.477785587310791, 1.5618045330047607, 1.6458234786987305, 1.7298424243927002, 1.81386137008667, 1.89788019657135, 1.9818991422653198, 2.06591796875, 2.1499369144439697, 2.2339558601379395, 2.317974805831909, 2.401993751525879, 2.4860126972198486, 2.5700316429138184, 2.654050350189209, 2.7380692958831787, 2.8220882415771484, 2.906107187271118, 2.990126132965088, 3.0741448402404785, 3.1581637859344482, 3.242182731628418, 3.3262014389038086, 3.4102203845977783, 3.494239330291748, 3.5782582759857178, 3.6622772216796875, 3.7462961673736572]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 29.0, 44.0, 49.0, 68.0, 67.0, 78.0, 35.0, 15.0, 18.0, 14.0, 3.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.592702627182007, -2.52793288230896, -2.463163375854492, -2.3983936309814453, -2.3336238861083984, -2.2688541412353516, -2.204084634780884, -2.139314889907837, -2.074545383453369, -2.0097756385803223, -1.945006012916565, -1.8802363872528076, -1.8154666423797607, -1.7506970167160034, -1.685927391052246, -1.6211576461791992, -1.5563879013061523, -1.491618275642395, -1.4268485307693481, -1.3620789051055908, -1.297309160232544, -1.2325395345687866, -1.1677699089050293, -1.1030001640319824, -1.038230538368225, -0.973460853099823, -0.9086911678314209, -0.8439215421676636, -0.7791518568992615, -0.7143821716308594, -0.649612545967102, -0.5848428606987, -0.5200729370117188, -0.45530325174331665, -0.39053359627723694, -0.3257639408111572, -0.2609942555427551, -0.19622457027435303, -0.13145491480827332, -0.0666852593421936, -0.001915574073791504, 0.0628540962934494, 0.1276237666606903, 0.1923934370279312, 0.2571631073951721, 0.3219327926635742, 0.38670244812965393, 0.45147210359573364, 0.5162417888641357, 0.5810114741325378, 0.6457811594009399, 0.7105507850646973, 0.7753204703330994, 0.8400901556015015, 0.9048597812652588, 0.9696294665336609, 1.034399151802063, 1.0991687774658203, 1.1639385223388672, 1.2287081480026245, 1.2934777736663818, 1.3582475185394287, 1.423017144203186, 1.4877867698669434, 1.5525565147399902]}, "eval/loss": 4.200125694274902, "eval/wer": 1.9598968663228877, "eval/runtime": 786.8447, "eval/samples_per_second": 3.358, "eval/steps_per_second": 0.281, "train/train_runtime": 5718.4377, "train/train_samples_per_second": 4.991, "train/train_steps_per_second": 0.104, "train/total_flos": 0.0, "train/train_loss": 4.336673439953865} \ No newline at end of file +{"train/loss": 4.4907, "train/learning_rate": 3.1914893617021275e-07, "train/epoch": 1.0, "train/global_step": 594, "_runtime": 6953, "_timestamp": 1646081192, "_step": 596, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 10.0, 548.0, 448.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.368497848510742, -13.00784683227539, -8.647195816040039, -4.2865447998046875, 0.07410621643066406, 4.434757232666016, 8.795408248901367, 13.156059265136719, 17.51671028137207, 21.877361297607422, 26.238012313842773, 30.598663330078125, 34.959312438964844, 39.31996536254883, 43.68061828613281, 48.04126739501953, 52.40191650390625, 56.76256561279297, 61.12321853637695, 65.48387145996094, 69.84452056884766, 74.20516967773438, 78.56582641601562, 82.92647552490234, 87.28712463378906, 91.64777374267578, 96.0084228515625, 100.36907958984375, 104.72972869873047, 109.09037780761719, 113.45103454589844, 117.81168365478516, 122.17233276367188, 126.5329818725586, 130.8936309814453, 135.25428771972656, 139.61492919921875, 143.9755859375, 148.33624267578125, 152.69688415527344, 157.0575408935547, 161.41819763183594, 165.77883911132812, 170.13949584960938, 174.50015258789062, 178.8607940673828, 183.22145080566406, 187.58209228515625, 191.9427490234375, 196.30340576171875, 200.66404724121094, 205.0247039794922, 209.38534545898438, 213.74600219726562, 218.10665893554688, 222.46730041503906, 226.8279571533203, 231.18861389160156, 235.54925537109375, 239.909912109375, 244.27056884765625, 248.63121032714844, 252.9918670654297, 257.3525085449219, 261.7131652832031]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 11.0, 7.0, 6.0, 16.0, 13.0, 18.0, 20.0, 23.0, 27.0, 29.0, 25.0, 36.0, 44.0, 38.0, 33.0, 30.0, 39.0, 56.0, 53.0, 59.0, 39.0, 36.0, 41.0, 37.0, 33.0, 35.0, 27.0, 23.0, 28.0, 28.0, 21.0, 13.0, 16.0, 5.0, 5.0, 10.0, 4.0, 2.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.572723388671875, -20.85820770263672, -20.143692016601562, -19.429176330566406, -18.71466064453125, -18.00014305114746, -17.285627365112305, -16.57111167907715, -15.856595993041992, -15.142080307006836, -14.42756462097168, -13.713047981262207, -12.99853229522705, -12.284016609191895, -11.569499969482422, -10.854984283447266, -10.14046859741211, -9.425952911376953, -8.711437225341797, -7.996920585632324, -7.282404899597168, -6.567889213562012, -5.853373050689697, -5.138856887817383, -4.424341201782227, -3.709825277328491, -2.995309352874756, -2.2807934284210205, -1.5662775039672852, -0.8517615795135498, -0.13724565505981445, 0.5772705078125, 1.2917861938476562, 2.0063021183013916, 2.720818042755127, 3.4353339672088623, 4.149849891662598, 4.864365577697754, 5.578881740570068, 6.293397903442383, 7.007913589477539, 7.722429275512695, 8.436944961547852, 9.151461601257324, 9.86597728729248, 10.580492973327637, 11.29500961303711, 12.009525299072266, 12.724040985107422, 13.438556671142578, 14.153072357177734, 14.867588996887207, 15.582104682922363, 16.296621322631836, 17.011137008666992, 17.72565269470215, 18.440168380737305, 19.15468406677246, 19.869199752807617, 20.583715438842773, 21.298233032226562, 22.01274871826172, 22.727264404296875, 23.44178009033203, 24.156295776367188]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 3.0, 8.0, 11.0, 10.0, 16.0, 22.0, 17.0, 19.0, 23.0, 36.0, 22.0, 35.0, 33.0, 30.0, 43.0, 39.0, 48.0, 41.0, 45.0, 49.0, 46.0, 42.0, 34.0, 30.0, 45.0, 35.0, 27.0, 33.0, 26.0, 30.0, 17.0, 16.0, 13.0, 6.0, 9.0, 5.0, 9.0, 10.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1525115966796875, -1.114593505859375, -1.0766754150390625, -1.03875732421875, -1.0008392333984375, -0.962921142578125, -0.9250030517578125, -0.8870849609375, -0.8491668701171875, -0.811248779296875, -0.7733306884765625, -0.73541259765625, -0.6974945068359375, -0.659576416015625, -0.6216583251953125, -0.583740234375, -0.5458221435546875, -0.507904052734375, -0.4699859619140625, -0.43206787109375, -0.3941497802734375, -0.356231689453125, -0.3183135986328125, -0.2803955078125, -0.2424774169921875, -0.204559326171875, -0.1666412353515625, -0.12872314453125, -0.0908050537109375, -0.052886962890625, -0.0149688720703125, 0.02294921875, 0.0608673095703125, 0.098785400390625, 0.1367034912109375, 0.17462158203125, 0.2125396728515625, 0.250457763671875, 0.2883758544921875, 0.3262939453125, 0.3642120361328125, 0.402130126953125, 0.4400482177734375, 0.47796630859375, 0.5158843994140625, 0.553802490234375, 0.5917205810546875, 0.629638671875, 0.6675567626953125, 0.705474853515625, 0.7433929443359375, 0.78131103515625, 0.8192291259765625, 0.857147216796875, 0.8950653076171875, 0.9329833984375, 0.9709014892578125, 1.008819580078125, 1.0467376708984375, 1.08465576171875, 1.1225738525390625, 1.160491943359375, 1.1984100341796875, 1.236328125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 9.0, 9.0, 24.0, 24.0, 33.0, 36.0, 57.0, 95.0, 129.0, 192.0, 308.0, 504.0, 775.0, 1315.0, 2239.0, 4421.0, 11468.0, 39459.0, 231150.0, 2016112.0, 1650216.0, 182969.0, 33397.0, 10070.0, 4090.0, 2023.0, 1151.0, 684.0, 434.0, 304.0, 161.0, 139.0, 71.0, 53.0, 40.0, 27.0, 16.0, 17.0, 9.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.978515625, -3.861297607421875, -3.74407958984375, -3.626861572265625, -3.5096435546875, -3.392425537109375, -3.27520751953125, -3.157989501953125, -3.040771484375, -2.923553466796875, -2.80633544921875, -2.689117431640625, -2.5718994140625, -2.454681396484375, -2.33746337890625, -2.220245361328125, -2.10302734375, -1.985809326171875, -1.86859130859375, -1.751373291015625, -1.6341552734375, -1.516937255859375, -1.39971923828125, -1.282501220703125, -1.165283203125, -1.048065185546875, -0.93084716796875, -0.813629150390625, -0.6964111328125, -0.579193115234375, -0.46197509765625, -0.344757080078125, -0.2275390625, -0.110321044921875, 0.00689697265625, 0.124114990234375, 0.2413330078125, 0.358551025390625, 0.47576904296875, 0.592987060546875, 0.710205078125, 0.827423095703125, 0.94464111328125, 1.061859130859375, 1.1790771484375, 1.296295166015625, 1.41351318359375, 1.530731201171875, 1.64794921875, 1.765167236328125, 1.88238525390625, 1.999603271484375, 2.1168212890625, 2.234039306640625, 2.35125732421875, 2.468475341796875, 2.585693359375, 2.702911376953125, 2.82012939453125, 2.937347412109375, 3.0545654296875, 3.171783447265625, 3.28900146484375, 3.406219482421875, 3.5234375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 20.0, 42.0, 64.0, 79.0, 143.0, 234.0, 413.0, 711.0, 810.0, 625.0, 349.0, 214.0, 124.0, 92.0, 54.0, 22.0, 21.0, 17.0, 11.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.62384033203125, -7.4078369140625, -7.19183349609375, -6.975830078125, -6.75982666015625, -6.5438232421875, -6.32781982421875, -6.11181640625, -5.89581298828125, -5.6798095703125, -5.46380615234375, -5.247802734375, -5.03179931640625, -4.8157958984375, -4.59979248046875, -4.3837890625, -4.16778564453125, -3.9517822265625, -3.73577880859375, -3.519775390625, -3.30377197265625, -3.0877685546875, -2.87176513671875, -2.65576171875, -2.43975830078125, -2.2237548828125, -2.00775146484375, -1.791748046875, -1.57574462890625, -1.3597412109375, -1.14373779296875, -0.927734375, -0.71173095703125, -0.4957275390625, -0.27972412109375, -0.063720703125, 0.15228271484375, 0.3682861328125, 0.58428955078125, 0.80029296875, 1.01629638671875, 1.2322998046875, 1.44830322265625, 1.664306640625, 1.88031005859375, 2.0963134765625, 2.31231689453125, 2.5283203125, 2.74432373046875, 2.9603271484375, 3.17633056640625, 3.392333984375, 3.60833740234375, 3.8243408203125, 4.04034423828125, 4.25634765625, 4.47235107421875, 4.6883544921875, 4.90435791015625, 5.120361328125, 5.33636474609375, 5.5523681640625, 5.76837158203125, 5.984375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 18.0, 21.0, 35.0, 81.0, 168.0, 287.0, 534.0, 1220.0, 3921.0, 70392.0, 4064315.0, 47327.0, 3595.0, 1183.0, 491.0, 299.0, 137.0, 85.0, 63.0, 28.0, 18.0, 7.0, 8.0, 8.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.046875, -22.358154296875, -21.66943359375, -20.980712890625, -20.2919921875, -19.603271484375, -18.91455078125, -18.225830078125, -17.537109375, -16.848388671875, -16.15966796875, -15.470947265625, -14.7822265625, -14.093505859375, -13.40478515625, -12.716064453125, -12.02734375, -11.338623046875, -10.64990234375, -9.961181640625, -9.2724609375, -8.583740234375, -7.89501953125, -7.206298828125, -6.517578125, -5.828857421875, -5.14013671875, -4.451416015625, -3.7626953125, -3.073974609375, -2.38525390625, -1.696533203125, -1.0078125, -0.319091796875, 0.36962890625, 1.058349609375, 1.7470703125, 2.435791015625, 3.12451171875, 3.813232421875, 4.501953125, 5.190673828125, 5.87939453125, 6.568115234375, 7.2568359375, 7.945556640625, 8.63427734375, 9.322998046875, 10.01171875, 10.700439453125, 11.38916015625, 12.077880859375, 12.7666015625, 13.455322265625, 14.14404296875, 14.832763671875, 15.521484375, 16.210205078125, 16.89892578125, 17.587646484375, 18.2763671875, 18.965087890625, 19.65380859375, 20.342529296875, 21.03125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 294.0, 709.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.29066467285156, -224.8906707763672, -220.4906768798828, -216.09068298339844, -211.69068908691406, -207.2906951904297, -202.8907012939453, -198.49069213867188, -194.0906982421875, -189.69070434570312, -185.29071044921875, -180.89071655273438, -176.49072265625, -172.09072875976562, -167.69073486328125, -163.29074096679688, -158.8907470703125, -154.49075317382812, -150.09075927734375, -145.69076538085938, -141.290771484375, -136.89077758789062, -132.49078369140625, -128.09078979492188, -123.69078826904297, -119.2907943725586, -114.89080047607422, -110.49080657958984, -106.09080505371094, -101.69081115722656, -97.29081726074219, -92.89082336425781, -88.49083709716797, -84.0908432006836, -79.69084930419922, -75.29085540771484, -70.89085388183594, -66.49085998535156, -62.09086608886719, -57.69087219238281, -53.29087829589844, -48.89088439941406, -44.49089050292969, -40.09089279174805, -35.69089889526367, -31.290904998779297, -26.89090919494629, -22.49091339111328, -18.090919494628906, -13.690924644470215, -9.290929794311523, -4.890934944152832, -0.4909400939941406, 3.9090538024902344, 8.309049606323242, 12.70904541015625, 17.109039306640625, 21.509033203125, 25.909029006958008, 30.309024810791016, 34.70901870727539, 39.109012603759766, 43.509010314941406, 47.90900421142578, 52.308998107910156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 6.0, 6.0, 14.0, 15.0, 15.0, 26.0, 29.0, 35.0, 34.0, 42.0, 38.0, 39.0, 54.0, 38.0, 63.0, 40.0, 40.0, 52.0, 53.0, 38.0, 40.0, 48.0, 33.0, 21.0, 27.0, 22.0, 18.0, 18.0, 21.0, 11.0, 9.0, 6.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.034442901611328, -19.45001220703125, -18.865581512451172, -18.281150817871094, -17.696720123291016, -17.11229133605957, -16.527860641479492, -15.943429946899414, -15.358999252319336, -14.774568557739258, -14.19013786315918, -13.605708122253418, -13.02127742767334, -12.436846733093262, -11.8524169921875, -11.267986297607422, -10.683555603027344, -10.099124908447266, -9.514694213867188, -8.930264472961426, -8.345833778381348, -7.7614030838012695, -7.17697286605835, -6.59254264831543, -6.008111953735352, -5.423681259155273, -4.8392510414123535, -4.254820823669434, -3.6703901290893555, -3.0859596729278564, -2.5015292167663574, -1.9170989990234375, -1.3326702117919922, -0.7482397556304932, -0.16380929946899414, 0.4206211566925049, 1.005051612854004, 1.589482069015503, 2.173912525177002, 2.758342742919922, 3.3427734375, 3.927203893661499, 4.511634349822998, 5.096064567565918, 5.680495262145996, 6.264925956726074, 6.849356174468994, 7.433786392211914, 8.018217086791992, 8.60264778137207, 9.187078475952148, 9.77150821685791, 10.355938911437988, 10.940369606018066, 11.524799346923828, 12.109230041503906, 12.693660736083984, 13.278091430664062, 13.86252212524414, 14.446951866149902, 15.03138256072998, 15.615813255310059, 16.20024299621582, 16.7846736907959, 17.369104385375977]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 11.0, 5.0, 7.0, 10.0, 11.0, 6.0, 12.0, 18.0, 21.0, 13.0, 23.0, 20.0, 24.0, 29.0, 31.0, 27.0, 27.0, 33.0, 26.0, 34.0, 34.0, 44.0, 45.0, 47.0, 45.0, 32.0, 33.0, 23.0, 33.0, 25.0, 33.0, 25.0, 27.0, 22.0, 18.0, 24.0, 20.0, 11.0, 14.0, 10.0, 10.0, 12.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.032379150390625, -0.99835205078125, -0.964324951171875, -0.9302978515625, -0.896270751953125, -0.86224365234375, -0.828216552734375, -0.794189453125, -0.760162353515625, -0.72613525390625, -0.692108154296875, -0.6580810546875, -0.624053955078125, -0.59002685546875, -0.555999755859375, -0.52197265625, -0.487945556640625, -0.45391845703125, -0.419891357421875, -0.3858642578125, -0.351837158203125, -0.31781005859375, -0.283782958984375, -0.249755859375, -0.215728759765625, -0.18170166015625, -0.147674560546875, -0.1136474609375, -0.079620361328125, -0.04559326171875, -0.011566162109375, 0.0224609375, 0.056488037109375, 0.09051513671875, 0.124542236328125, 0.1585693359375, 0.192596435546875, 0.22662353515625, 0.260650634765625, 0.294677734375, 0.328704833984375, 0.36273193359375, 0.396759033203125, 0.4307861328125, 0.464813232421875, 0.49884033203125, 0.532867431640625, 0.56689453125, 0.600921630859375, 0.63494873046875, 0.668975830078125, 0.7030029296875, 0.737030029296875, 0.77105712890625, 0.805084228515625, 0.839111328125, 0.873138427734375, 0.90716552734375, 0.941192626953125, 0.9752197265625, 1.009246826171875, 1.04327392578125, 1.077301025390625, 1.111328125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 11.0, 24.0, 24.0, 25.0, 50.0, 86.0, 137.0, 213.0, 302.0, 403.0, 732.0, 1084.0, 1653.0, 2619.0, 4081.0, 6619.0, 10496.0, 17099.0, 27926.0, 45922.0, 78847.0, 149047.0, 323990.0, 165198.0, 84497.0, 49332.0, 29557.0, 18126.0, 11362.0, 6977.0, 4440.0, 2777.0, 1726.0, 1103.0, 729.0, 455.0, 319.0, 174.0, 112.0, 90.0, 57.0, 44.0, 21.0, 19.0, 17.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2437744140625, -0.23628807067871094, -0.22880172729492188, -0.2213153839111328, -0.21382904052734375, -0.2063426971435547, -0.19885635375976562, -0.19137001037597656, -0.1838836669921875, -0.17639732360839844, -0.16891098022460938, -0.1614246368408203, -0.15393829345703125, -0.1464519500732422, -0.13896560668945312, -0.13147926330566406, -0.123992919921875, -0.11650657653808594, -0.10902023315429688, -0.10153388977050781, -0.09404754638671875, -0.08656120300292969, -0.07907485961914062, -0.07158851623535156, -0.0641021728515625, -0.05661582946777344, -0.049129486083984375, -0.04164314270019531, -0.03415679931640625, -0.026670455932617188, -0.019184112548828125, -0.011697769165039062, -0.00421142578125, 0.0032749176025390625, 0.010761260986328125, 0.018247604370117188, 0.02573394775390625, 0.03322029113769531, 0.040706634521484375, 0.04819297790527344, 0.0556793212890625, 0.06316566467285156, 0.07065200805664062, 0.07813835144042969, 0.08562469482421875, 0.09311103820800781, 0.10059738159179688, 0.10808372497558594, 0.115570068359375, 0.12305641174316406, 0.13054275512695312, 0.1380290985107422, 0.14551544189453125, 0.1530017852783203, 0.16048812866210938, 0.16797447204589844, 0.1754608154296875, 0.18294715881347656, 0.19043350219726562, 0.1979198455810547, 0.20540618896484375, 0.2128925323486328, 0.22037887573242188, 0.22786521911621094, 0.2353515625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 3.0, 6.0, 6.0, 5.0, 7.0, 8.0, 11.0, 12.0, 16.0, 14.0, 23.0, 32.0, 29.0, 29.0, 26.0, 21.0, 38.0, 31.0, 35.0, 40.0, 44.0, 41.0, 1065.0, 35.0, 35.0, 43.0, 31.0, 38.0, 30.0, 34.0, 22.0, 22.0, 18.0, 29.0, 28.0, 14.0, 13.0, 18.0, 15.0, 10.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.72607421875, -0.703216552734375, -0.68035888671875, -0.657501220703125, -0.6346435546875, -0.611785888671875, -0.58892822265625, -0.566070556640625, -0.543212890625, -0.520355224609375, -0.49749755859375, -0.474639892578125, -0.4517822265625, -0.428924560546875, -0.40606689453125, -0.383209228515625, -0.3603515625, -0.337493896484375, -0.31463623046875, -0.291778564453125, -0.2689208984375, -0.246063232421875, -0.22320556640625, -0.200347900390625, -0.177490234375, -0.154632568359375, -0.13177490234375, -0.108917236328125, -0.0860595703125, -0.063201904296875, -0.04034423828125, -0.017486572265625, 0.00537109375, 0.028228759765625, 0.05108642578125, 0.073944091796875, 0.0968017578125, 0.119659423828125, 0.14251708984375, 0.165374755859375, 0.188232421875, 0.211090087890625, 0.23394775390625, 0.256805419921875, 0.2796630859375, 0.302520751953125, 0.32537841796875, 0.348236083984375, 0.37109375, 0.393951416015625, 0.41680908203125, 0.439666748046875, 0.4625244140625, 0.485382080078125, 0.50823974609375, 0.531097412109375, 0.553955078125, 0.576812744140625, 0.59967041015625, 0.622528076171875, 0.6453857421875, 0.668243408203125, 0.69110107421875, 0.713958740234375, 0.73681640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 12.0, 19.0, 34.0, 51.0, 71.0, 83.0, 133.0, 169.0, 292.0, 432.0, 528.0, 813.0, 1101.0, 1715.0, 2372.0, 3365.0, 5158.0, 7405.0, 10987.0, 16247.0, 24782.0, 39352.0, 63459.0, 112377.0, 1253693.0, 263974.0, 111353.0, 63116.0, 38834.0, 24805.0, 16195.0, 10821.0, 7183.0, 4971.0, 3420.0, 2335.0, 1677.0, 1175.0, 764.0, 542.0, 415.0, 300.0, 191.0, 108.0, 92.0, 73.0, 40.0, 38.0, 20.0, 6.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.194580078125, -0.18849754333496094, -0.18241500854492188, -0.1763324737548828, -0.17024993896484375, -0.1641674041748047, -0.15808486938476562, -0.15200233459472656, -0.1459197998046875, -0.13983726501464844, -0.13375473022460938, -0.1276721954345703, -0.12158966064453125, -0.11550712585449219, -0.10942459106445312, -0.10334205627441406, -0.097259521484375, -0.09117698669433594, -0.08509445190429688, -0.07901191711425781, -0.07292938232421875, -0.06684684753417969, -0.060764312744140625, -0.05468177795410156, -0.0485992431640625, -0.04251670837402344, -0.036434173583984375, -0.030351638793945312, -0.02426910400390625, -0.018186569213867188, -0.012104034423828125, -0.0060214996337890625, 6.103515625e-05, 0.0061435699462890625, 0.012226104736328125, 0.018308639526367188, 0.02439117431640625, 0.030473709106445312, 0.036556243896484375, 0.04263877868652344, 0.0487213134765625, 0.05480384826660156, 0.060886383056640625, 0.06696891784667969, 0.07305145263671875, 0.07913398742675781, 0.08521652221679688, 0.09129905700683594, 0.097381591796875, 0.10346412658691406, 0.10954666137695312, 0.11562919616699219, 0.12171173095703125, 0.1277942657470703, 0.13387680053710938, 0.13995933532714844, 0.1460418701171875, 0.15212440490722656, 0.15820693969726562, 0.1642894744873047, 0.17037200927734375, 0.1764545440673828, 0.18253707885742188, 0.18861961364746094, 0.1947021484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 21.0, 28.0, 35.0, 57.0, 67.0, 86.0, 110.0, 125.0, 110.0, 99.0, 74.0, 56.0, 39.0, 30.0, 12.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021141767501831055, -0.0002034902572631836, -0.00019556283950805664, -0.0001876354217529297, -0.00017970800399780273, -0.00017178058624267578, -0.00016385316848754883, -0.00015592575073242188, -0.00014799833297729492, -0.00014007091522216797, -0.00013214349746704102, -0.00012421607971191406, -0.00011628866195678711, -0.00010836124420166016, -0.0001004338264465332, -9.250640869140625e-05, -8.45789909362793e-05, -7.665157318115234e-05, -6.872415542602539e-05, -6.079673767089844e-05, -5.2869319915771484e-05, -4.494190216064453e-05, -3.701448440551758e-05, -2.9087066650390625e-05, -2.1159648895263672e-05, -1.3232231140136719e-05, -5.304813385009766e-06, 2.6226043701171875e-06, 1.055002212524414e-05, 1.8477439880371094e-05, 2.6404857635498047e-05, 3.4332275390625e-05, 4.225969314575195e-05, 5.0187110900878906e-05, 5.811452865600586e-05, 6.604194641113281e-05, 7.396936416625977e-05, 8.189678192138672e-05, 8.982419967651367e-05, 9.775161743164062e-05, 0.00010567903518676758, 0.00011360645294189453, 0.00012153387069702148, 0.00012946128845214844, 0.0001373887062072754, 0.00014531612396240234, 0.0001532435417175293, 0.00016117095947265625, 0.0001690983772277832, 0.00017702579498291016, 0.0001849532127380371, 0.00019288063049316406, 0.00020080804824829102, 0.00020873546600341797, 0.00021666288375854492, 0.00022459030151367188, 0.00023251771926879883, 0.00024044513702392578, 0.00024837255477905273, 0.0002562999725341797, 0.00026422739028930664, 0.0002721548080444336, 0.00028008222579956055, 0.0002880096435546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 8.0, 9.0, 11.0, 16.0, 31.0, 39.0, 73.0, 113.0, 195.0, 287.0, 619.0, 2068.0, 1042181.0, 1615.0, 552.0, 292.0, 177.0, 100.0, 71.0, 37.0, 16.0, 21.0, 13.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004764556884765625, -0.0046176910400390625, -0.0044708251953125, -0.0043239593505859375, -0.004177093505859375, -0.0040302276611328125, -0.00388336181640625, -0.0037364959716796875, -0.003589630126953125, -0.0034427642822265625, -0.0032958984375, -0.0031490325927734375, -0.003002166748046875, -0.0028553009033203125, -0.00270843505859375, -0.0025615692138671875, -0.002414703369140625, -0.0022678375244140625, -0.0021209716796875, -0.0019741058349609375, -0.001827239990234375, -0.0016803741455078125, -0.00153350830078125, -0.0013866424560546875, -0.001239776611328125, -0.0010929107666015625, -0.000946044921875, -0.0007991790771484375, -0.000652313232421875, -0.0005054473876953125, -0.00035858154296875, -0.0002117156982421875, -6.4849853515625e-05, 8.20159912109375e-05, 0.0002288818359375, 0.0003757476806640625, 0.000522613525390625, 0.0006694793701171875, 0.00081634521484375, 0.0009632110595703125, 0.001110076904296875, 0.0012569427490234375, 0.00140380859375, 0.0015506744384765625, 0.001697540283203125, 0.0018444061279296875, 0.00199127197265625, 0.0021381378173828125, 0.002285003662109375, 0.0024318695068359375, 0.0025787353515625, 0.0027256011962890625, 0.002872467041015625, 0.0030193328857421875, 0.00316619873046875, 0.0033130645751953125, 0.003459930419921875, 0.0036067962646484375, 0.003753662109375, 0.0039005279541015625, 0.004047393798828125, 0.0041942596435546875, 0.00434112548828125, 0.0044879913330078125, 0.004634857177734375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 16.0, 303.0, 585.0, 105.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00050628453027457, -0.0004960133810527623, -0.000485742260934785, -0.0004754711117129773, -0.00046519996249116957, -0.0004549288423731923, -0.0004446576931513846, -0.0004343865439295769, -0.00042411539470776916, -0.00041384424548596144, -0.0004035731253679842, -0.00039330197614617646, -0.00038303082692436874, -0.0003727597068063915, -0.00036248855758458376, -0.00035221740836277604, -0.0003419462882447988, -0.00033167513902299106, -0.0003214040189050138, -0.0003111328696832061, -0.00030086172046139836, -0.00029059057123959064, -0.0002803194511216134, -0.00027004830189980567, -0.0002597771817818284, -0.0002495060325600207, -0.0002392348978901282, -0.0002289637632202357, -0.000218692613998428, -0.0002084214793285355, -0.000198150344658643, -0.0001878791954368353, -0.00017760807531885803, -0.00016733694064896554, -0.00015706579142715782, -0.00014679465675726533, -0.0001365235075354576, -0.00012625237286556512, -0.00011598123819567263, -0.00010571009624982253, -9.543895430397242e-05, -8.516781235812232e-05, -7.489667041227221e-05, -6.462553574237972e-05, -5.435439379652962e-05, -4.408325185067952e-05, -3.381211718078703e-05, -2.3540975234936923e-05, -1.3269833289086819e-05, -2.998693162226118e-06, 7.272446964634582e-06, 1.754358527250588e-05, 2.7814727218355983e-05, 3.808586916420609e-05, 4.835700383409858e-05, 5.862814577994868e-05, 6.889928772579879e-05, 7.917042967164889e-05, 8.9441571617499e-05, 9.971270628739148e-05, 0.00010998384823324159, 0.00012025499017909169, 0.00013052612484898418, 0.00014079725951887667, 0.0001510684087406844]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 9.0, 8.0, 13.0, 19.0, 21.0, 16.0, 18.0, 19.0, 29.0, 37.0, 24.0, 35.0, 30.0, 53.0, 46.0, 35.0, 43.0, 42.0, 33.0, 40.0, 47.0, 52.0, 35.0, 40.0, 26.0, 26.0, 35.0, 30.0, 25.0, 21.0, 18.0, 12.0, 12.0, 7.0, 6.0, 11.0, 4.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.325410842895508e-05, -7.086247205734253e-05, -6.847083568572998e-05, -6.607919931411743e-05, -6.368756294250488e-05, -6.129592657089233e-05, -5.8904290199279785e-05, -5.6512653827667236e-05, -5.412101745605469e-05, -5.172938108444214e-05, -4.933774471282959e-05, -4.694610834121704e-05, -4.455447196960449e-05, -4.216283559799194e-05, -3.9771199226379395e-05, -3.7379562854766846e-05, -3.49879264831543e-05, -3.259629011154175e-05, -3.02046537399292e-05, -2.781301736831665e-05, -2.54213809967041e-05, -2.3029744625091553e-05, -2.0638108253479004e-05, -1.8246471881866455e-05, -1.5854835510253906e-05, -1.3463199138641357e-05, -1.1071562767028809e-05, -8.67992639541626e-06, -6.288290023803711e-06, -3.896653652191162e-06, -1.5050172805786133e-06, 8.866190910339355e-07, 3.2782554626464844e-06, 5.669891834259033e-06, 8.061528205871582e-06, 1.0453164577484131e-05, 1.284480094909668e-05, 1.5236437320709229e-05, 1.7628073692321777e-05, 2.0019710063934326e-05, 2.2411346435546875e-05, 2.4802982807159424e-05, 2.7194619178771973e-05, 2.958625555038452e-05, 3.197789192199707e-05, 3.436952829360962e-05, 3.676116466522217e-05, 3.915280103683472e-05, 4.1544437408447266e-05, 4.3936073780059814e-05, 4.632771015167236e-05, 4.871934652328491e-05, 5.111098289489746e-05, 5.350261926651001e-05, 5.589425563812256e-05, 5.828589200973511e-05, 6.0677528381347656e-05, 6.30691647529602e-05, 6.546080112457275e-05, 6.78524374961853e-05, 7.024407386779785e-05, 7.26357102394104e-05, 7.502734661102295e-05, 7.74189829826355e-05, 7.981061935424805e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 11.0, 5.0, 7.0, 10.0, 11.0, 6.0, 12.0, 18.0, 21.0, 13.0, 23.0, 20.0, 24.0, 29.0, 31.0, 27.0, 27.0, 33.0, 26.0, 34.0, 34.0, 44.0, 45.0, 47.0, 45.0, 32.0, 33.0, 23.0, 33.0, 25.0, 33.0, 25.0, 27.0, 22.0, 18.0, 24.0, 20.0, 11.0, 14.0, 10.0, 10.0, 12.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.032379150390625, -0.99835205078125, -0.964324951171875, -0.9302978515625, -0.896270751953125, -0.86224365234375, -0.828216552734375, -0.794189453125, -0.760162353515625, -0.72613525390625, -0.692108154296875, -0.6580810546875, -0.624053955078125, -0.59002685546875, -0.555999755859375, -0.52197265625, -0.487945556640625, -0.45391845703125, -0.419891357421875, -0.3858642578125, -0.351837158203125, -0.31781005859375, -0.283782958984375, -0.249755859375, -0.215728759765625, -0.18170166015625, -0.147674560546875, -0.1136474609375, -0.079620361328125, -0.04559326171875, -0.011566162109375, 0.0224609375, 0.056488037109375, 0.09051513671875, 0.124542236328125, 0.1585693359375, 0.192596435546875, 0.22662353515625, 0.260650634765625, 0.294677734375, 0.328704833984375, 0.36273193359375, 0.396759033203125, 0.4307861328125, 0.464813232421875, 0.49884033203125, 0.532867431640625, 0.56689453125, 0.600921630859375, 0.63494873046875, 0.668975830078125, 0.7030029296875, 0.737030029296875, 0.77105712890625, 0.805084228515625, 0.839111328125, 0.873138427734375, 0.90716552734375, 0.941192626953125, 0.9752197265625, 1.009246826171875, 1.04327392578125, 1.077301025390625, 1.111328125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 4.0, 9.0, 11.0, 21.0, 27.0, 37.0, 45.0, 73.0, 88.0, 110.0, 171.0, 270.0, 334.0, 519.0, 719.0, 1083.0, 1663.0, 2503.0, 4059.0, 7399.0, 17489.0, 70645.0, 506436.0, 354813.0, 48849.0, 14066.0, 6385.0, 3654.0, 2283.0, 1491.0, 957.0, 718.0, 507.0, 319.0, 196.0, 162.0, 125.0, 80.0, 74.0, 47.0, 29.0, 20.0, 13.0, 11.0, 10.0, 10.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.953125, -4.79278564453125, -4.6324462890625, -4.47210693359375, -4.311767578125, -4.15142822265625, -3.9910888671875, -3.83074951171875, -3.67041015625, -3.51007080078125, -3.3497314453125, -3.18939208984375, -3.029052734375, -2.86871337890625, -2.7083740234375, -2.54803466796875, -2.3876953125, -2.22735595703125, -2.0670166015625, -1.90667724609375, -1.746337890625, -1.58599853515625, -1.4256591796875, -1.26531982421875, -1.10498046875, -0.94464111328125, -0.7843017578125, -0.62396240234375, -0.463623046875, -0.30328369140625, -0.1429443359375, 0.01739501953125, 0.177734375, 0.33807373046875, 0.4984130859375, 0.65875244140625, 0.819091796875, 0.97943115234375, 1.1397705078125, 1.30010986328125, 1.46044921875, 1.62078857421875, 1.7811279296875, 1.94146728515625, 2.101806640625, 2.26214599609375, 2.4224853515625, 2.58282470703125, 2.7431640625, 2.90350341796875, 3.0638427734375, 3.22418212890625, 3.384521484375, 3.54486083984375, 3.7052001953125, 3.86553955078125, 4.02587890625, 4.18621826171875, 4.3465576171875, 4.50689697265625, 4.667236328125, 4.82757568359375, 4.9879150390625, 5.14825439453125, 5.30859375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 2.0, 3.0, 4.0, 11.0, 7.0, 8.0, 15.0, 13.0, 16.0, 18.0, 19.0, 20.0, 26.0, 18.0, 28.0, 24.0, 47.0, 38.0, 41.0, 68.0, 104.0, 239.0, 1374.0, 266.0, 128.0, 80.0, 39.0, 46.0, 37.0, 51.0, 27.0, 24.0, 31.0, 30.0, 29.0, 19.0, 13.0, 18.0, 15.0, 13.0, 9.0, 8.0, 3.0, 0.0, 6.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.6875, -3.580596923828125, -3.47369384765625, -3.366790771484375, -3.2598876953125, -3.152984619140625, -3.04608154296875, -2.939178466796875, -2.832275390625, -2.725372314453125, -2.61846923828125, -2.511566162109375, -2.4046630859375, -2.297760009765625, -2.19085693359375, -2.083953857421875, -1.97705078125, -1.870147705078125, -1.76324462890625, -1.656341552734375, -1.5494384765625, -1.442535400390625, -1.33563232421875, -1.228729248046875, -1.121826171875, -1.014923095703125, -0.90802001953125, -0.801116943359375, -0.6942138671875, -0.587310791015625, -0.48040771484375, -0.373504638671875, -0.2666015625, -0.159698486328125, -0.05279541015625, 0.054107666015625, 0.1610107421875, 0.267913818359375, 0.37481689453125, 0.481719970703125, 0.588623046875, 0.695526123046875, 0.80242919921875, 0.909332275390625, 1.0162353515625, 1.123138427734375, 1.23004150390625, 1.336944580078125, 1.44384765625, 1.550750732421875, 1.65765380859375, 1.764556884765625, 1.8714599609375, 1.978363037109375, 2.08526611328125, 2.192169189453125, 2.299072265625, 2.405975341796875, 2.51287841796875, 2.619781494140625, 2.7266845703125, 2.833587646484375, 2.94049072265625, 3.047393798828125, 3.154296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 8.0, 12.0, 11.0, 13.0, 18.0, 26.0, 18.0, 34.0, 35.0, 39.0, 59.0, 87.0, 118.0, 233.0, 451.0, 1447.0, 31931.0, 3073544.0, 35047.0, 1408.0, 469.0, 224.0, 127.0, 66.0, 54.0, 28.0, 27.0, 27.0, 20.0, 26.0, 14.0, 10.0, 8.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 8.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.515625, -12.07666015625, -11.6376953125, -11.19873046875, -10.759765625, -10.32080078125, -9.8818359375, -9.44287109375, -9.00390625, -8.56494140625, -8.1259765625, -7.68701171875, -7.248046875, -6.80908203125, -6.3701171875, -5.93115234375, -5.4921875, -5.05322265625, -4.6142578125, -4.17529296875, -3.736328125, -3.29736328125, -2.8583984375, -2.41943359375, -1.98046875, -1.54150390625, -1.1025390625, -0.66357421875, -0.224609375, 0.21435546875, 0.6533203125, 1.09228515625, 1.53125, 1.97021484375, 2.4091796875, 2.84814453125, 3.287109375, 3.72607421875, 4.1650390625, 4.60400390625, 5.04296875, 5.48193359375, 5.9208984375, 6.35986328125, 6.798828125, 7.23779296875, 7.6767578125, 8.11572265625, 8.5546875, 8.99365234375, 9.4326171875, 9.87158203125, 10.310546875, 10.74951171875, 11.1884765625, 11.62744140625, 12.06640625, 12.50537109375, 12.9443359375, 13.38330078125, 13.822265625, 14.26123046875, 14.7001953125, 15.13916015625, 15.578125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 960.0, 56.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.90650177001953, -50.222145080566406, -44.53778839111328, -38.853431701660156, -33.16907501220703, -27.48472023010254, -21.800365447998047, -16.116008758544922, -10.431652069091797, -4.74729585647583, 0.9370603561401367, 6.621416091918945, 12.30577278137207, 17.990129470825195, 23.674484252929688, 29.358840942382812, 35.04319763183594, 40.72755432128906, 46.41191101074219, 52.09626770019531, 57.78062438964844, 63.46498107910156, 69.14933776855469, 74.83369445800781, 80.51805114746094, 86.20240783691406, 91.88676452636719, 97.57112121582031, 103.25547790527344, 108.93983459472656, 114.62419128417969, 120.30854797363281, 125.99290466308594, 131.67726135253906, 137.3616180419922, 143.0459747314453, 148.73033142089844, 154.41468811035156, 160.0990447998047, 165.7834014892578, 171.46775817871094, 177.15211486816406, 182.8364715576172, 188.5208282470703, 194.20518493652344, 199.88954162597656, 205.5738983154297, 211.2582550048828, 216.94259643554688, 222.626953125, 228.31130981445312, 233.99566650390625, 239.68002319335938, 245.3643798828125, 251.04873657226562, 256.73309326171875, 262.4174499511719, 268.101806640625, 273.7861633300781, 279.47052001953125, 285.1548767089844, 290.8392333984375, 296.5235900878906, 302.20794677734375, 307.8923034667969]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 9.0, 3.0, 4.0, 16.0, 16.0, 9.0, 23.0, 25.0, 15.0, 32.0, 31.0, 39.0, 36.0, 38.0, 23.0, 49.0, 56.0, 42.0, 45.0, 47.0, 28.0, 32.0, 42.0, 41.0, 33.0, 35.0, 29.0, 22.0, 25.0, 11.0, 23.0, 18.0, 8.0, 24.0, 13.0, 8.0, 13.0, 2.0, 5.0, 8.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.243245124816895, -10.839468955993652, -10.43569278717041, -10.031916618347168, -9.628141403198242, -9.224365234375, -8.820589065551758, -8.416812896728516, -8.013036727905273, -7.609260559082031, -7.205484390258789, -6.801708698272705, -6.397932529449463, -5.994156360626221, -5.590380668640137, -5.1866044998168945, -4.782828330993652, -4.37905216217041, -3.975276231765747, -3.571500301361084, -3.167724132537842, -2.7639479637145996, -2.3601720333099365, -1.9563961029052734, -1.5526199340820312, -1.1488438844680786, -0.745067834854126, -0.34129178524017334, 0.0624842643737793, 0.4662604331970215, 0.8700363636016846, 1.2738122940063477, 1.6775875091552734, 2.0813636779785156, 2.4851396083831787, 2.888915538787842, 3.292691707611084, 3.696467876434326, 4.10024356842041, 4.504019737243652, 4.9077959060668945, 5.311572074890137, 5.715348243713379, 6.119123935699463, 6.522900104522705, 6.926676273345947, 7.330451965332031, 7.734228134155273, 8.138004302978516, 8.541780471801758, 8.945556640625, 9.349332809448242, 9.753108978271484, 10.156885147094727, 10.560660362243652, 10.964436531066895, 11.368212699890137, 11.771988868713379, 12.175765037536621, 12.579541206359863, 12.983316421508789, 13.387092590332031, 13.790868759155273, 14.194644927978516, 14.598421096801758]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 15.0, 6.0, 12.0, 14.0, 8.0, 18.0, 16.0, 19.0, 20.0, 26.0, 32.0, 22.0, 24.0, 29.0, 27.0, 25.0, 24.0, 41.0, 44.0, 48.0, 39.0, 45.0, 34.0, 43.0, 26.0, 28.0, 34.0, 26.0, 29.0, 22.0, 30.0, 30.0, 21.0, 18.0, 9.0, 14.0, 15.0, 20.0, 10.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.2529296875, -1.21636962890625, -1.1798095703125, -1.14324951171875, -1.106689453125, -1.07012939453125, -1.0335693359375, -0.99700927734375, -0.96044921875, -0.92388916015625, -0.8873291015625, -0.85076904296875, -0.814208984375, -0.77764892578125, -0.7410888671875, -0.70452880859375, -0.66796875, -0.63140869140625, -0.5948486328125, -0.55828857421875, -0.521728515625, -0.48516845703125, -0.4486083984375, -0.41204833984375, -0.37548828125, -0.33892822265625, -0.3023681640625, -0.26580810546875, -0.229248046875, -0.19268798828125, -0.1561279296875, -0.11956787109375, -0.0830078125, -0.04644775390625, -0.0098876953125, 0.02667236328125, 0.063232421875, 0.09979248046875, 0.1363525390625, 0.17291259765625, 0.20947265625, 0.24603271484375, 0.2825927734375, 0.31915283203125, 0.355712890625, 0.39227294921875, 0.4288330078125, 0.46539306640625, 0.501953125, 0.53851318359375, 0.5750732421875, 0.61163330078125, 0.648193359375, 0.68475341796875, 0.7213134765625, 0.75787353515625, 0.79443359375, 0.83099365234375, 0.8675537109375, 0.90411376953125, 0.940673828125, 0.97723388671875, 1.0137939453125, 1.05035400390625, 1.0869140625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 24.0, 30.0, 36.0, 52.0, 57.0, 83.0, 103.0, 152.0, 242.0, 359.0, 511.0, 827.0, 1439.0, 2827.0, 6366.0, 17360.0, 66136.0, 514416.0, 2859697.0, 617148.0, 73559.0, 18923.0, 6806.0, 3008.0, 1502.0, 908.0, 507.0, 353.0, 229.0, 174.0, 109.0, 74.0, 63.0, 42.0, 35.0, 24.0, 12.0, 17.0, 11.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.0390625, -4.8887939453125, -4.738525390625, -4.5882568359375, -4.43798828125, -4.2877197265625, -4.137451171875, -3.9871826171875, -3.8369140625, -3.6866455078125, -3.536376953125, -3.3861083984375, -3.23583984375, -3.0855712890625, -2.935302734375, -2.7850341796875, -2.634765625, -2.4844970703125, -2.334228515625, -2.1839599609375, -2.03369140625, -1.8834228515625, -1.733154296875, -1.5828857421875, -1.4326171875, -1.2823486328125, -1.132080078125, -0.9818115234375, -0.83154296875, -0.6812744140625, -0.531005859375, -0.3807373046875, -0.23046875, -0.0802001953125, 0.070068359375, 0.2203369140625, 0.37060546875, 0.5208740234375, 0.671142578125, 0.8214111328125, 0.9716796875, 1.1219482421875, 1.272216796875, 1.4224853515625, 1.57275390625, 1.7230224609375, 1.873291015625, 2.0235595703125, 2.173828125, 2.3240966796875, 2.474365234375, 2.6246337890625, 2.77490234375, 2.9251708984375, 3.075439453125, 3.2257080078125, 3.3759765625, 3.5262451171875, 3.676513671875, 3.8267822265625, 3.97705078125, 4.1273193359375, 4.277587890625, 4.4278564453125, 4.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 10.0, 3.0, 18.0, 17.0, 46.0, 78.0, 125.0, 169.0, 311.0, 493.0, 590.0, 711.0, 511.0, 339.0, 231.0, 157.0, 112.0, 64.0, 33.0, 21.0, 22.0, 6.0, 4.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.86236572265625, -8.6466064453125, -8.43084716796875, -8.215087890625, -7.99932861328125, -7.7835693359375, -7.56781005859375, -7.35205078125, -7.13629150390625, -6.9205322265625, -6.70477294921875, -6.489013671875, -6.27325439453125, -6.0574951171875, -5.84173583984375, -5.6259765625, -5.41021728515625, -5.1944580078125, -4.97869873046875, -4.762939453125, -4.54718017578125, -4.3314208984375, -4.11566162109375, -3.89990234375, -3.68414306640625, -3.4683837890625, -3.25262451171875, -3.036865234375, -2.82110595703125, -2.6053466796875, -2.38958740234375, -2.173828125, -1.95806884765625, -1.7423095703125, -1.52655029296875, -1.310791015625, -1.09503173828125, -0.8792724609375, -0.66351318359375, -0.44775390625, -0.23199462890625, -0.0162353515625, 0.19952392578125, 0.415283203125, 0.63104248046875, 0.8468017578125, 1.06256103515625, 1.2783203125, 1.49407958984375, 1.7098388671875, 1.92559814453125, 2.141357421875, 2.35711669921875, 2.5728759765625, 2.78863525390625, 3.00439453125, 3.22015380859375, 3.4359130859375, 3.65167236328125, 3.867431640625, 4.08319091796875, 4.2989501953125, 4.51470947265625, 4.73046875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [5.0, 4.0, 12.0, 13.0, 10.0, 25.0, 56.0, 73.0, 113.0, 192.0, 535.0, 2456.0, 449861.0, 3734267.0, 5573.0, 676.0, 218.0, 99.0, 53.0, 19.0, 20.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5625, -10.68359375, -9.8046875, -8.92578125, -8.046875, -7.16796875, -6.2890625, -5.41015625, -4.53125, -3.65234375, -2.7734375, -1.89453125, -1.015625, -0.13671875, 0.7421875, 1.62109375, 2.5, 3.37890625, 4.2578125, 5.13671875, 6.015625, 6.89453125, 7.7734375, 8.65234375, 9.53125, 10.41015625, 11.2890625, 12.16796875, 13.046875, 13.92578125, 14.8046875, 15.68359375, 16.5625, 17.44140625, 18.3203125, 19.19921875, 20.078125, 20.95703125, 21.8359375, 22.71484375, 23.59375, 24.47265625, 25.3515625, 26.23046875, 27.109375, 27.98828125, 28.8671875, 29.74609375, 30.625, 31.50390625, 32.3828125, 33.26171875, 34.140625, 35.01953125, 35.8984375, 36.77734375, 37.65625, 38.53515625, 39.4140625, 40.29296875, 41.171875, 42.05078125, 42.9296875, 43.80859375, 44.6875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 770.0, 245.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.78044128417969, -51.89575958251953, -46.01108169555664, -40.12640380859375, -34.241722106933594, -28.35704231262207, -22.472362518310547, -16.587684631347656, -10.7030029296875, -4.818323135375977, 1.0663566589355469, 6.95103645324707, 12.835716247558594, 18.720396041870117, 24.60507583618164, 30.48975372314453, 36.37443542480469, 42.259117126464844, 48.143795013427734, 54.028472900390625, 59.91315460205078, 65.79783630371094, 71.68251037597656, 77.56719207763672, 83.45187377929688, 89.33655548095703, 95.22123718261719, 101.10591125488281, 106.99059295654297, 112.87527465820312, 118.75994873046875, 124.6446304321289, 130.529296875, 136.41397094726562, 142.2986602783203, 148.18333435058594, 154.06802368164062, 159.95269775390625, 165.83737182617188, 171.7220458984375, 177.6067352294922, 183.4914093017578, 189.3760986328125, 195.26077270507812, 201.14544677734375, 207.03013610839844, 212.91481018066406, 218.79949951171875, 224.68417358398438, 230.56884765625, 236.4535369873047, 242.3382110595703, 248.222900390625, 254.10757446289062, 259.99224853515625, 265.8769226074219, 271.7615966796875, 277.6462707519531, 283.53094482421875, 289.4156494140625, 295.3003234863281, 301.18499755859375, 307.0696716308594, 312.954345703125, 318.83905029296875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 7.0, 16.0, 8.0, 15.0, 19.0, 24.0, 19.0, 23.0, 30.0, 34.0, 32.0, 36.0, 44.0, 37.0, 35.0, 48.0, 48.0, 43.0, 51.0, 43.0, 48.0, 50.0, 34.0, 39.0, 32.0, 29.0, 35.0, 20.0, 10.0, 19.0, 13.0, 9.0, 9.0, 8.0, 8.0, 7.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.02631378173828, -22.363508224487305, -21.700700759887695, -21.03789520263672, -20.37508773803711, -19.712282180786133, -19.049474716186523, -18.386669158935547, -17.723861694335938, -17.06105613708496, -16.39824867248535, -15.735442161560059, -15.072635650634766, -14.409830093383789, -13.747023582458496, -13.084217071533203, -12.421411514282227, -11.758605003356934, -11.09579849243164, -10.432991981506348, -9.770185470581055, -9.107379913330078, -8.444573402404785, -7.781766891479492, -7.118960380554199, -6.456153869628906, -5.793347358703613, -5.1305413246154785, -4.4677348136901855, -3.8049283027648926, -3.1421220302581787, -2.479315757751465, -1.8165092468261719, -1.1537028551101685, -0.49089646339416504, 0.17190992832183838, 0.8347163200378418, 1.4975228309631348, 2.1603291034698486, 2.8231353759765625, 3.4859418869018555, 4.148748397827148, 4.811554908752441, 5.474360942840576, 6.137167453765869, 6.799973964691162, 7.462779998779297, 8.12558650970459, 8.788393020629883, 9.451199531555176, 10.114006042480469, 10.776812553405762, 11.439619064331055, 12.102424621582031, 12.765231132507324, 13.428037643432617, 14.09084415435791, 14.753650665283203, 15.416457176208496, 16.07926368713379, 16.742069244384766, 17.404876708984375, 18.06768226623535, 18.730487823486328, 19.393295288085938]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 9.0, 8.0, 15.0, 19.0, 15.0, 26.0, 24.0, 29.0, 25.0, 26.0, 24.0, 31.0, 39.0, 38.0, 33.0, 36.0, 37.0, 43.0, 47.0, 37.0, 36.0, 32.0, 37.0, 38.0, 29.0, 24.0, 29.0, 26.0, 19.0, 25.0, 24.0, 26.0, 10.0, 11.0, 7.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.3779296875, -1.339202880859375, -1.30047607421875, -1.261749267578125, -1.2230224609375, -1.184295654296875, -1.14556884765625, -1.106842041015625, -1.068115234375, -1.029388427734375, -0.99066162109375, -0.951934814453125, -0.9132080078125, -0.874481201171875, -0.83575439453125, -0.797027587890625, -0.75830078125, -0.719573974609375, -0.68084716796875, -0.642120361328125, -0.6033935546875, -0.564666748046875, -0.52593994140625, -0.487213134765625, -0.448486328125, -0.409759521484375, -0.37103271484375, -0.332305908203125, -0.2935791015625, -0.254852294921875, -0.21612548828125, -0.177398681640625, -0.138671875, -0.099945068359375, -0.06121826171875, -0.022491455078125, 0.0162353515625, 0.054962158203125, 0.09368896484375, 0.132415771484375, 0.171142578125, 0.209869384765625, 0.24859619140625, 0.287322998046875, 0.3260498046875, 0.364776611328125, 0.40350341796875, 0.442230224609375, 0.48095703125, 0.519683837890625, 0.55841064453125, 0.597137451171875, 0.6358642578125, 0.674591064453125, 0.71331787109375, 0.752044677734375, 0.790771484375, 0.829498291015625, 0.86822509765625, 0.906951904296875, 0.9456787109375, 0.984405517578125, 1.02313232421875, 1.061859130859375, 1.1005859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 12.0, 17.0, 24.0, 24.0, 39.0, 52.0, 80.0, 112.0, 193.0, 282.0, 465.0, 691.0, 1142.0, 1924.0, 3093.0, 5257.0, 8927.0, 15091.0, 25303.0, 42881.0, 74932.0, 145783.0, 314831.0, 189454.0, 91957.0, 51160.0, 30220.0, 18036.0, 10646.0, 6194.0, 3791.0, 2289.0, 1371.0, 814.0, 464.0, 333.0, 219.0, 155.0, 98.0, 73.0, 44.0, 28.0, 20.0, 10.0, 9.0, 5.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0], "bins": [-0.28564453125, -0.27740478515625, -0.2691650390625, -0.26092529296875, -0.252685546875, -0.24444580078125, -0.2362060546875, -0.22796630859375, -0.2197265625, -0.21148681640625, -0.2032470703125, -0.19500732421875, -0.186767578125, -0.17852783203125, -0.1702880859375, -0.16204833984375, -0.15380859375, -0.14556884765625, -0.1373291015625, -0.12908935546875, -0.120849609375, -0.11260986328125, -0.1043701171875, -0.09613037109375, -0.087890625, -0.07965087890625, -0.0714111328125, -0.06317138671875, -0.054931640625, -0.04669189453125, -0.0384521484375, -0.03021240234375, -0.02197265625, -0.01373291015625, -0.0054931640625, 0.00274658203125, 0.010986328125, 0.01922607421875, 0.0274658203125, 0.03570556640625, 0.0439453125, 0.05218505859375, 0.0604248046875, 0.06866455078125, 0.076904296875, 0.08514404296875, 0.0933837890625, 0.10162353515625, 0.10986328125, 0.11810302734375, 0.1263427734375, 0.13458251953125, 0.142822265625, 0.15106201171875, 0.1593017578125, 0.16754150390625, 0.17578125, 0.18402099609375, 0.1922607421875, 0.20050048828125, 0.208740234375, 0.21697998046875, 0.2252197265625, 0.23345947265625, 0.24169921875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 12.0, 12.0, 14.0, 22.0, 12.0, 22.0, 22.0, 33.0, 31.0, 35.0, 44.0, 35.0, 43.0, 38.0, 46.0, 46.0, 1063.0, 47.0, 40.0, 48.0, 38.0, 36.0, 38.0, 24.0, 21.0, 31.0, 33.0, 24.0, 23.0, 13.0, 18.0, 7.0, 8.0, 7.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.830078125, -0.8025436401367188, -0.7750091552734375, -0.7474746704101562, -0.719940185546875, -0.6924057006835938, -0.6648712158203125, -0.6373367309570312, -0.60980224609375, -0.5822677612304688, -0.5547332763671875, -0.5271987915039062, -0.499664306640625, -0.47212982177734375, -0.4445953369140625, -0.41706085205078125, -0.3895263671875, -0.36199188232421875, -0.3344573974609375, -0.30692291259765625, -0.279388427734375, -0.25185394287109375, -0.2243194580078125, -0.19678497314453125, -0.16925048828125, -0.14171600341796875, -0.1141815185546875, -0.08664703369140625, -0.059112548828125, -0.03157806396484375, -0.0040435791015625, 0.02349090576171875, 0.051025390625, 0.07855987548828125, 0.1060943603515625, 0.13362884521484375, 0.161163330078125, 0.18869781494140625, 0.2162322998046875, 0.24376678466796875, 0.27130126953125, 0.29883575439453125, 0.3263702392578125, 0.35390472412109375, 0.381439208984375, 0.40897369384765625, 0.4365081787109375, 0.46404266357421875, 0.4915771484375, 0.5191116333007812, 0.5466461181640625, 0.5741806030273438, 0.601715087890625, 0.6292495727539062, 0.6567840576171875, 0.6843185424804688, 0.71185302734375, 0.7393875122070312, 0.7669219970703125, 0.7944564819335938, 0.821990966796875, 0.8495254516601562, 0.8770599365234375, 0.9045944213867188, 0.93212890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 10.0, 12.0, 14.0, 27.0, 36.0, 58.0, 71.0, 109.0, 165.0, 246.0, 347.0, 516.0, 717.0, 1119.0, 1657.0, 2609.0, 3925.0, 6104.0, 9618.0, 15148.0, 24681.0, 41662.0, 73662.0, 147079.0, 1361971.0, 189366.0, 89605.0, 49602.0, 28669.0, 17219.0, 10838.0, 7004.0, 4461.0, 2947.0, 1915.0, 1246.0, 875.0, 585.0, 381.0, 270.0, 187.0, 135.0, 91.0, 48.0, 44.0, 27.0, 26.0, 12.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23046875, -0.22294998168945312, -0.21543121337890625, -0.20791244506835938, -0.2003936767578125, -0.19287490844726562, -0.18535614013671875, -0.17783737182617188, -0.170318603515625, -0.16279983520507812, -0.15528106689453125, -0.14776229858398438, -0.1402435302734375, -0.13272476196289062, -0.12520599365234375, -0.11768722534179688, -0.11016845703125, -0.10264968872070312, -0.09513092041015625, -0.08761215209960938, -0.0800933837890625, -0.07257461547851562, -0.06505584716796875, -0.057537078857421875, -0.050018310546875, -0.042499542236328125, -0.03498077392578125, -0.027462005615234375, -0.0199432373046875, -0.012424468994140625, -0.00490570068359375, 0.002613067626953125, 0.0101318359375, 0.017650604248046875, 0.02516937255859375, 0.032688140869140625, 0.0402069091796875, 0.047725677490234375, 0.05524444580078125, 0.06276321411132812, 0.070281982421875, 0.07780075073242188, 0.08531951904296875, 0.09283828735351562, 0.1003570556640625, 0.10787582397460938, 0.11539459228515625, 0.12291336059570312, 0.13043212890625, 0.13795089721679688, 0.14546966552734375, 0.15298843383789062, 0.1605072021484375, 0.16802597045898438, 0.17554473876953125, 0.18306350708007812, 0.190582275390625, 0.19810104370117188, 0.20561981201171875, 0.21313858032226562, 0.2206573486328125, 0.22817611694335938, 0.23569488525390625, 0.24321365356445312, 0.250732421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 17.0, 10.0, 13.0, 19.0, 21.0, 27.0, 24.0, 40.0, 35.0, 39.0, 32.0, 34.0, 42.0, 50.0, 43.0, 40.0, 50.0, 46.0, 50.0, 42.0, 42.0, 37.0, 26.0, 23.0, 29.0, 24.0, 18.0, 13.0, 13.0, 15.0, 13.0, 11.0, 7.0, 5.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.79304313659668e-05, -9.470432996749878e-05, -9.147822856903076e-05, -8.825212717056274e-05, -8.502602577209473e-05, -8.179992437362671e-05, -7.857382297515869e-05, -7.534772157669067e-05, -7.212162017822266e-05, -6.889551877975464e-05, -6.566941738128662e-05, -6.24433159828186e-05, -5.9217214584350586e-05, -5.599111318588257e-05, -5.276501178741455e-05, -4.953891038894653e-05, -4.6312808990478516e-05, -4.30867075920105e-05, -3.986060619354248e-05, -3.663450479507446e-05, -3.3408403396606445e-05, -3.0182301998138428e-05, -2.695620059967041e-05, -2.3730099201202393e-05, -2.0503997802734375e-05, -1.7277896404266357e-05, -1.405179500579834e-05, -1.0825693607330322e-05, -7.599592208862305e-06, -4.373490810394287e-06, -1.1473894119262695e-06, 2.078711986541748e-06, 5.304813385009766e-06, 8.530914783477783e-06, 1.17570161819458e-05, 1.4983117580413818e-05, 1.8209218978881836e-05, 2.1435320377349854e-05, 2.466142177581787e-05, 2.788752317428589e-05, 3.1113624572753906e-05, 3.4339725971221924e-05, 3.756582736968994e-05, 4.079192876815796e-05, 4.4018030166625977e-05, 4.7244131565093994e-05, 5.047023296356201e-05, 5.369633436203003e-05, 5.692243576049805e-05, 6.0148537158966064e-05, 6.337463855743408e-05, 6.66007399559021e-05, 6.982684135437012e-05, 7.305294275283813e-05, 7.627904415130615e-05, 7.950514554977417e-05, 8.273124694824219e-05, 8.59573483467102e-05, 8.918344974517822e-05, 9.240955114364624e-05, 9.563565254211426e-05, 9.886175394058228e-05, 0.00010208785533905029, 0.00010531395673751831, 0.00010854005813598633]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 10.0, 10.0, 14.0, 12.0, 20.0, 25.0, 26.0, 44.0, 58.0, 63.0, 74.0, 83.0, 118.0, 126.0, 157.0, 226.0, 332.0, 527.0, 1289.0, 217665.0, 823049.0, 2369.0, 642.0, 440.0, 254.0, 193.0, 135.0, 109.0, 89.0, 80.0, 63.0, 45.0, 38.0, 22.0, 27.0, 17.0, 22.0, 17.0, 12.0, 10.0, 14.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0021381378173828125, -0.002075508236885071, -0.002012878656387329, -0.0019502490758895874, -0.0018876194953918457, -0.001824989914894104, -0.0017623603343963623, -0.0016997307538986206, -0.001637101173400879, -0.0015744715929031372, -0.0015118420124053955, -0.0014492124319076538, -0.0013865828514099121, -0.0013239532709121704, -0.0012613236904144287, -0.001198694109916687, -0.0011360645294189453, -0.0010734349489212036, -0.001010805368423462, -0.0009481757879257202, -0.0008855462074279785, -0.0008229166269302368, -0.0007602870464324951, -0.0006976574659347534, -0.0006350278854370117, -0.00057239830493927, -0.0005097687244415283, -0.0004471391439437866, -0.0003845095634460449, -0.0003218799829483032, -0.0002592504024505615, -0.00019662082195281982, -0.00013399124145507812, -7.136166095733643e-05, -8.732080459594727e-06, 5.389750003814697e-05, 0.00011652708053588867, 0.00017915666103363037, 0.00024178624153137207, 0.00030441582202911377, 0.00036704540252685547, 0.00042967498302459717, 0.0004923045635223389, 0.0005549341440200806, 0.0006175637245178223, 0.000680193305015564, 0.0007428228855133057, 0.0008054524660110474, 0.0008680820465087891, 0.0009307116270065308, 0.0009933412075042725, 0.0010559707880020142, 0.0011186003684997559, 0.0011812299489974976, 0.0012438595294952393, 0.001306489109992981, 0.0013691186904907227, 0.0014317482709884644, 0.001494377851486206, 0.0015570074319839478, 0.0016196370124816895, 0.0016822665929794312, 0.0017448961734771729, 0.0018075257539749146, 0.0018701553344726562]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 24.0, 106.0, 240.0, 321.0, 211.0, 81.0, 25.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000263611989794299, -0.0002574029203969985, -0.0002511938218958676, -0.0002449847524985671, -0.0002387756685493514, -0.00023256658460013568, -0.00022635750065091997, -0.00022014841670170426, -0.00021393934730440378, -0.00020773026335518807, -0.00020152117940597236, -0.00019531211000867188, -0.00018910302605945617, -0.00018289394211024046, -0.00017668485816102475, -0.00017047577421180904, -0.00016426670481450856, -0.00015805762086529285, -0.00015184853691607714, -0.00014563946751877666, -0.00013943038356956095, -0.00013322129962034523, -0.00012701221567112952, -0.00012080313899787143, -0.0001145940477726981, -0.0001083849638234824, -0.0001021758871502243, -9.596680320100859e-05, -8.975772652775049e-05, -8.354864257853478e-05, -7.733955862931907e-05, -7.113048195606098e-05, -6.492140528280288e-05, -5.871232497156598e-05, -5.2503244660329074e-05, -4.6294160711113364e-05, -4.008508403785527e-05, -3.387600008863956e-05, -2.7666919777402654e-05, -2.145783946616575e-05, -1.5248759154928848e-05, -9.039678843691945e-06, -2.8305976229603402e-06, 3.3784835977712646e-06, 9.587563909008168e-06, 1.5796646039234474e-05, 2.2005726350471377e-05, 2.821480666170828e-05, 3.4423886972945184e-05, 4.0632967284182087e-05, 4.684204759541899e-05, 5.30511315446347e-05, 5.9260208217892796e-05, 6.54692921671085e-05, 7.16783688403666e-05, 7.788745278958231e-05, 8.409653673879802e-05, 9.030562068801373e-05, 9.651469736127183e-05, 0.00010272378131048754, 0.00010893285798374563, 0.00011514194193296134, 0.00012135102588217705, 0.00012756010983139277, 0.00013376917922869325]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 5.0, 7.0, 11.0, 16.0, 10.0, 15.0, 15.0, 18.0, 29.0, 30.0, 29.0, 26.0, 29.0, 36.0, 22.0, 56.0, 41.0, 40.0, 39.0, 47.0, 40.0, 49.0, 31.0, 29.0, 37.0, 29.0, 33.0, 35.0, 32.0, 24.0, 22.0, 18.0, 14.0, 21.0, 12.0, 9.0, 12.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.598234176635742e-05, -6.400793790817261e-05, -6.203353404998779e-05, -6.005913019180298e-05, -5.8084726333618164e-05, -5.611032247543335e-05, -5.4135918617248535e-05, -5.216151475906372e-05, -5.0187110900878906e-05, -4.821270704269409e-05, -4.623830318450928e-05, -4.426389932632446e-05, -4.228949546813965e-05, -4.0315091609954834e-05, -3.834068775177002e-05, -3.6366283893585205e-05, -3.439188003540039e-05, -3.2417476177215576e-05, -3.0443072319030762e-05, -2.8468668460845947e-05, -2.6494264602661133e-05, -2.451986074447632e-05, -2.2545456886291504e-05, -2.057105302810669e-05, -1.8596649169921875e-05, -1.662224531173706e-05, -1.4647841453552246e-05, -1.2673437595367432e-05, -1.0699033737182617e-05, -8.724629878997803e-06, -6.750226020812988e-06, -4.775822162628174e-06, -2.8014183044433594e-06, -8.270144462585449e-07, 1.1473894119262695e-06, 3.121793270111084e-06, 5.0961971282958984e-06, 7.070600986480713e-06, 9.045004844665527e-06, 1.1019408702850342e-05, 1.2993812561035156e-05, 1.496821641921997e-05, 1.6942620277404785e-05, 1.89170241355896e-05, 2.0891427993774414e-05, 2.286583185195923e-05, 2.4840235710144043e-05, 2.6814639568328857e-05, 2.8789043426513672e-05, 3.0763447284698486e-05, 3.27378511428833e-05, 3.4712255001068115e-05, 3.668665885925293e-05, 3.8661062717437744e-05, 4.063546657562256e-05, 4.260987043380737e-05, 4.458427429199219e-05, 4.6558678150177e-05, 4.8533082008361816e-05, 5.050748586654663e-05, 5.2481889724731445e-05, 5.445629358291626e-05, 5.6430697441101074e-05, 5.840510129928589e-05, 6.03795051574707e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 9.0, 8.0, 15.0, 19.0, 15.0, 26.0, 24.0, 29.0, 25.0, 26.0, 24.0, 31.0, 39.0, 38.0, 33.0, 36.0, 37.0, 43.0, 47.0, 37.0, 36.0, 32.0, 37.0, 38.0, 29.0, 24.0, 29.0, 26.0, 19.0, 25.0, 24.0, 26.0, 10.0, 11.0, 7.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.3779296875, -1.339202880859375, -1.30047607421875, -1.261749267578125, -1.2230224609375, -1.184295654296875, -1.14556884765625, -1.106842041015625, -1.068115234375, -1.029388427734375, -0.99066162109375, -0.951934814453125, -0.9132080078125, -0.874481201171875, -0.83575439453125, -0.797027587890625, -0.75830078125, -0.719573974609375, -0.68084716796875, -0.642120361328125, -0.6033935546875, -0.564666748046875, -0.52593994140625, -0.487213134765625, -0.448486328125, -0.409759521484375, -0.37103271484375, -0.332305908203125, -0.2935791015625, -0.254852294921875, -0.21612548828125, -0.177398681640625, -0.138671875, -0.099945068359375, -0.06121826171875, -0.022491455078125, 0.0162353515625, 0.054962158203125, 0.09368896484375, 0.132415771484375, 0.171142578125, 0.209869384765625, 0.24859619140625, 0.287322998046875, 0.3260498046875, 0.364776611328125, 0.40350341796875, 0.442230224609375, 0.48095703125, 0.519683837890625, 0.55841064453125, 0.597137451171875, 0.6358642578125, 0.674591064453125, 0.71331787109375, 0.752044677734375, 0.790771484375, 0.829498291015625, 0.86822509765625, 0.906951904296875, 0.9456787109375, 0.984405517578125, 1.02313232421875, 1.061859130859375, 1.1005859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 11.0, 9.0, 17.0, 16.0, 23.0, 40.0, 61.0, 67.0, 112.0, 136.0, 203.0, 297.0, 405.0, 708.0, 1196.0, 2100.0, 4135.0, 8320.0, 18818.0, 45157.0, 109850.0, 233362.0, 300918.0, 182887.0, 79674.0, 32335.0, 13680.0, 6383.0, 3213.0, 1673.0, 961.0, 559.0, 374.0, 227.0, 198.0, 107.0, 88.0, 65.0, 41.0, 49.0, 24.0, 16.0, 15.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.763671875, -1.7137298583984375, -1.663787841796875, -1.6138458251953125, -1.56390380859375, -1.5139617919921875, -1.464019775390625, -1.4140777587890625, -1.3641357421875, -1.3141937255859375, -1.264251708984375, -1.2143096923828125, -1.16436767578125, -1.1144256591796875, -1.064483642578125, -1.0145416259765625, -0.964599609375, -0.9146575927734375, -0.864715576171875, -0.8147735595703125, -0.76483154296875, -0.7148895263671875, -0.664947509765625, -0.6150054931640625, -0.5650634765625, -0.5151214599609375, -0.465179443359375, -0.4152374267578125, -0.36529541015625, -0.3153533935546875, -0.265411376953125, -0.2154693603515625, -0.16552734375, -0.1155853271484375, -0.065643310546875, -0.0157012939453125, 0.03424072265625, 0.0841827392578125, 0.134124755859375, 0.1840667724609375, 0.2340087890625, 0.2839508056640625, 0.333892822265625, 0.3838348388671875, 0.43377685546875, 0.4837188720703125, 0.533660888671875, 0.5836029052734375, 0.633544921875, 0.6834869384765625, 0.733428955078125, 0.7833709716796875, 0.83331298828125, 0.8832550048828125, 0.933197021484375, 0.9831390380859375, 1.0330810546875, 1.0830230712890625, 1.132965087890625, 1.1829071044921875, 1.23284912109375, 1.2827911376953125, 1.332733154296875, 1.3826751708984375, 1.4326171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 3.0, 5.0, 12.0, 15.0, 11.0, 13.0, 20.0, 25.0, 23.0, 35.0, 30.0, 38.0, 46.0, 46.0, 59.0, 86.0, 154.0, 315.0, 1390.0, 197.0, 99.0, 67.0, 51.0, 40.0, 38.0, 37.0, 24.0, 23.0, 18.0, 26.0, 18.0, 10.0, 16.0, 8.0, 7.0, 10.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.67431640625, -4.5244140625, -4.37451171875, -4.224609375, -4.07470703125, -3.9248046875, -3.77490234375, -3.625, -3.47509765625, -3.3251953125, -3.17529296875, -3.025390625, -2.87548828125, -2.7255859375, -2.57568359375, -2.42578125, -2.27587890625, -2.1259765625, -1.97607421875, -1.826171875, -1.67626953125, -1.5263671875, -1.37646484375, -1.2265625, -1.07666015625, -0.9267578125, -0.77685546875, -0.626953125, -0.47705078125, -0.3271484375, -0.17724609375, -0.02734375, 0.12255859375, 0.2724609375, 0.42236328125, 0.572265625, 0.72216796875, 0.8720703125, 1.02197265625, 1.171875, 1.32177734375, 1.4716796875, 1.62158203125, 1.771484375, 1.92138671875, 2.0712890625, 2.22119140625, 2.37109375, 2.52099609375, 2.6708984375, 2.82080078125, 2.970703125, 3.12060546875, 3.2705078125, 3.42041015625, 3.5703125, 3.72021484375, 3.8701171875, 4.02001953125, 4.169921875, 4.31982421875, 4.4697265625, 4.61962890625, 4.76953125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 11.0, 7.0, 15.0, 12.0, 10.0, 16.0, 18.0, 23.0, 25.0, 37.0, 51.0, 73.0, 103.0, 155.0, 290.0, 572.0, 1856.0, 24930.0, 2746057.0, 363908.0, 5446.0, 961.0, 404.0, 228.0, 131.0, 90.0, 62.0, 45.0, 23.0, 29.0, 22.0, 17.0, 18.0, 12.0, 15.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.65625, -9.352294921875, -9.04833984375, -8.744384765625, -8.4404296875, -8.136474609375, -7.83251953125, -7.528564453125, -7.224609375, -6.920654296875, -6.61669921875, -6.312744140625, -6.0087890625, -5.704833984375, -5.40087890625, -5.096923828125, -4.79296875, -4.489013671875, -4.18505859375, -3.881103515625, -3.5771484375, -3.273193359375, -2.96923828125, -2.665283203125, -2.361328125, -2.057373046875, -1.75341796875, -1.449462890625, -1.1455078125, -0.841552734375, -0.53759765625, -0.233642578125, 0.0703125, 0.374267578125, 0.67822265625, 0.982177734375, 1.2861328125, 1.590087890625, 1.89404296875, 2.197998046875, 2.501953125, 2.805908203125, 3.10986328125, 3.413818359375, 3.7177734375, 4.021728515625, 4.32568359375, 4.629638671875, 4.93359375, 5.237548828125, 5.54150390625, 5.845458984375, 6.1494140625, 6.453369140625, 6.75732421875, 7.061279296875, 7.365234375, 7.669189453125, 7.97314453125, 8.277099609375, 8.5810546875, 8.885009765625, 9.18896484375, 9.492919921875, 9.796875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 30.0, 100.0, 245.0, 326.0, 214.0, 72.0, 15.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.365718841552734, -26.832176208496094, -26.298633575439453, -25.765090942382812, -25.231548309326172, -24.698007583618164, -24.164464950561523, -23.630922317504883, -23.097379684448242, -22.5638370513916, -22.03029441833496, -21.49675178527832, -20.963211059570312, -20.429668426513672, -19.89612579345703, -19.36258316040039, -18.82904052734375, -18.29549789428711, -17.76195526123047, -17.228412628173828, -16.694869995117188, -16.16132926940918, -15.627786636352539, -15.094244003295898, -14.560701370239258, -14.027158737182617, -13.493616104125977, -12.960074424743652, -12.426531791687012, -11.892989158630371, -11.359447479248047, -10.825904846191406, -10.292362213134766, -9.758819580078125, -9.225276947021484, -8.69173526763916, -8.15819263458252, -7.624650001525879, -7.0911078453063965, -6.557565689086914, -6.024022579193115, -5.490480422973633, -4.956937789916992, -4.423395156860352, -3.889853000640869, -3.3563106060028076, -2.822768211364746, -2.2892258167266846, -1.755683422088623, -1.2221410274505615, -0.6885986328125, -0.15505623817443848, 0.37848615646362305, 0.9120285511016846, 1.445570945739746, 1.9791133403778076, 2.512655735015869, 3.0461981296539307, 3.579740524291992, 4.113283157348633, 4.646825313568115, 5.180367469787598, 5.713910102844238, 6.247452735900879, 6.780994892120361]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 5.0, 7.0, 8.0, 7.0, 15.0, 12.0, 12.0, 10.0, 21.0, 19.0, 18.0, 27.0, 31.0, 35.0, 40.0, 25.0, 37.0, 46.0, 39.0, 28.0, 42.0, 32.0, 32.0, 31.0, 31.0, 37.0, 36.0, 29.0, 34.0, 33.0, 32.0, 29.0, 13.0, 29.0, 19.0, 9.0, 11.0, 14.0, 9.0, 12.0, 8.0, 10.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.07627010345459, -12.650373458862305, -12.224477767944336, -11.79858112335205, -11.372684478759766, -10.946788787841797, -10.520892143249512, -10.094995498657227, -9.669099807739258, -9.243203163146973, -8.817307472229004, -8.391410827636719, -7.965514659881592, -7.539618492126465, -7.11372184753418, -6.687825679779053, -6.261929035186768, -5.836032867431641, -5.4101362228393555, -4.9842400550842285, -4.558343887329102, -4.132447242736816, -3.7065510749816895, -3.2806549072265625, -2.8547585010528564, -2.4288620948791504, -2.0029659271240234, -1.5770695209503174, -1.1511732339859009, -0.7252769470214844, -0.2993805408477783, 0.12651562690734863, 0.5524120330810547, 0.9783083200454712, 1.4042046070098877, 1.8301010131835938, 2.2559971809387207, 2.6818935871124268, 3.107789993286133, 3.5336861610412598, 3.959582567214966, 4.385478973388672, 4.811375141143799, 5.237271308898926, 5.663167953491211, 6.089064121246338, 6.514960289001465, 6.94085693359375, 7.366753101348877, 7.792649269104004, 8.218545913696289, 8.644441604614258, 9.070338249206543, 9.496234893798828, 9.922130584716797, 10.348027229309082, 10.773923873901367, 11.199820518493652, 11.625716209411621, 12.051612854003906, 12.477509498596191, 12.90340518951416, 13.329301834106445, 13.755197525024414, 14.1810941696167]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 10.0, 3.0, 12.0, 15.0, 15.0, 20.0, 26.0, 22.0, 23.0, 28.0, 25.0, 36.0, 27.0, 37.0, 36.0, 47.0, 35.0, 47.0, 42.0, 47.0, 37.0, 33.0, 30.0, 36.0, 33.0, 37.0, 29.0, 28.0, 28.0, 21.0, 14.0, 18.0, 19.0, 15.0, 12.0, 11.0, 9.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.5, -1.4578704833984375, -1.415740966796875, -1.3736114501953125, -1.33148193359375, -1.2893524169921875, -1.247222900390625, -1.2050933837890625, -1.1629638671875, -1.1208343505859375, -1.078704833984375, -1.0365753173828125, -0.99444580078125, -0.9523162841796875, -0.910186767578125, -0.8680572509765625, -0.825927734375, -0.7837982177734375, -0.741668701171875, -0.6995391845703125, -0.65740966796875, -0.6152801513671875, -0.573150634765625, -0.5310211181640625, -0.4888916015625, -0.4467620849609375, -0.404632568359375, -0.3625030517578125, -0.32037353515625, -0.2782440185546875, -0.236114501953125, -0.1939849853515625, -0.15185546875, -0.1097259521484375, -0.067596435546875, -0.0254669189453125, 0.01666259765625, 0.0587921142578125, 0.100921630859375, 0.1430511474609375, 0.1851806640625, 0.2273101806640625, 0.269439697265625, 0.3115692138671875, 0.35369873046875, 0.3958282470703125, 0.437957763671875, 0.4800872802734375, 0.522216796875, 0.5643463134765625, 0.606475830078125, 0.6486053466796875, 0.69073486328125, 0.7328643798828125, 0.774993896484375, 0.8171234130859375, 0.8592529296875, 0.9013824462890625, 0.943511962890625, 0.9856414794921875, 1.02777099609375, 1.0699005126953125, 1.112030029296875, 1.1541595458984375, 1.1962890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 6.0, 13.0, 14.0, 14.0, 20.0, 19.0, 38.0, 52.0, 56.0, 78.0, 106.0, 180.0, 341.0, 752.0, 2231.0, 9942.0, 75733.0, 1169697.0, 2659620.0, 245612.0, 23152.0, 4187.0, 1185.0, 468.0, 200.0, 161.0, 100.0, 55.0, 57.0, 50.0, 23.0, 16.0, 17.0, 14.0, 11.0, 21.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.65234375, -4.50335693359375, -4.3543701171875, -4.20538330078125, -4.056396484375, -3.90740966796875, -3.7584228515625, -3.60943603515625, -3.46044921875, -3.31146240234375, -3.1624755859375, -3.01348876953125, -2.864501953125, -2.71551513671875, -2.5665283203125, -2.41754150390625, -2.2685546875, -2.11956787109375, -1.9705810546875, -1.82159423828125, -1.672607421875, -1.52362060546875, -1.3746337890625, -1.22564697265625, -1.07666015625, -0.92767333984375, -0.7786865234375, -0.62969970703125, -0.480712890625, -0.33172607421875, -0.1827392578125, -0.03375244140625, 0.115234375, 0.26422119140625, 0.4132080078125, 0.56219482421875, 0.711181640625, 0.86016845703125, 1.0091552734375, 1.15814208984375, 1.30712890625, 1.45611572265625, 1.6051025390625, 1.75408935546875, 1.903076171875, 2.05206298828125, 2.2010498046875, 2.35003662109375, 2.4990234375, 2.64801025390625, 2.7969970703125, 2.94598388671875, 3.094970703125, 3.24395751953125, 3.3929443359375, 3.54193115234375, 3.69091796875, 3.83990478515625, 3.9888916015625, 4.13787841796875, 4.286865234375, 4.43585205078125, 4.5848388671875, 4.73382568359375, 4.8828125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 14.0, 19.0, 25.0, 43.0, 65.0, 111.0, 189.0, 287.0, 429.0, 561.0, 639.0, 530.0, 420.0, 256.0, 172.0, 113.0, 75.0, 62.0, 22.0, 10.0, 8.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.667510986328125, -8.46783447265625, -8.268157958984375, -8.0684814453125, -7.868804931640625, -7.66912841796875, -7.469451904296875, -7.269775390625, -7.070098876953125, -6.87042236328125, -6.670745849609375, -6.4710693359375, -6.271392822265625, -6.07171630859375, -5.872039794921875, -5.67236328125, -5.472686767578125, -5.27301025390625, -5.073333740234375, -4.8736572265625, -4.673980712890625, -4.47430419921875, -4.274627685546875, -4.074951171875, -3.875274658203125, -3.67559814453125, -3.475921630859375, -3.2762451171875, -3.076568603515625, -2.87689208984375, -2.677215576171875, -2.4775390625, -2.277862548828125, -2.07818603515625, -1.878509521484375, -1.6788330078125, -1.479156494140625, -1.27947998046875, -1.079803466796875, -0.880126953125, -0.680450439453125, -0.48077392578125, -0.281097412109375, -0.0814208984375, 0.118255615234375, 0.31793212890625, 0.517608642578125, 0.71728515625, 0.916961669921875, 1.11663818359375, 1.316314697265625, 1.5159912109375, 1.715667724609375, 1.91534423828125, 2.115020751953125, 2.314697265625, 2.514373779296875, 2.71405029296875, 2.913726806640625, 3.1134033203125, 3.313079833984375, 3.51275634765625, 3.712432861328125, 3.912109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 9.0, 16.0, 17.0, 51.0, 77.0, 138.0, 201.0, 445.0, 969.0, 5580.0, 250136.0, 3817389.0, 113831.0, 3874.0, 828.0, 314.0, 150.0, 106.0, 49.0, 30.0, 17.0, 21.0, 7.0, 7.0, 4.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.24267578125, -10.7822265625, -10.32177734375, -9.861328125, -9.40087890625, -8.9404296875, -8.47998046875, -8.01953125, -7.55908203125, -7.0986328125, -6.63818359375, -6.177734375, -5.71728515625, -5.2568359375, -4.79638671875, -4.3359375, -3.87548828125, -3.4150390625, -2.95458984375, -2.494140625, -2.03369140625, -1.5732421875, -1.11279296875, -0.65234375, -0.19189453125, 0.2685546875, 0.72900390625, 1.189453125, 1.64990234375, 2.1103515625, 2.57080078125, 3.03125, 3.49169921875, 3.9521484375, 4.41259765625, 4.873046875, 5.33349609375, 5.7939453125, 6.25439453125, 6.71484375, 7.17529296875, 7.6357421875, 8.09619140625, 8.556640625, 9.01708984375, 9.4775390625, 9.93798828125, 10.3984375, 10.85888671875, 11.3193359375, 11.77978515625, 12.240234375, 12.70068359375, 13.1611328125, 13.62158203125, 14.08203125, 14.54248046875, 15.0029296875, 15.46337890625, 15.923828125, 16.38427734375, 16.8447265625, 17.30517578125, 17.765625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 26.0, 42.0, 95.0, 138.0, 178.0, 174.0, 158.0, 92.0, 61.0, 29.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.693729400634766, -36.87528610229492, -36.05684280395508, -35.238399505615234, -34.41995620727539, -33.60151290893555, -32.7830696105957, -31.964624404907227, -31.146181106567383, -30.32773780822754, -29.509294509887695, -28.69085121154785, -27.872407913208008, -27.05396270751953, -26.235519409179688, -25.417076110839844, -24.5986328125, -23.780189514160156, -22.961746215820312, -22.14330291748047, -21.324859619140625, -20.50641632080078, -19.687973022460938, -18.86952781677246, -18.05108642578125, -17.232643127441406, -16.414199829101562, -15.595756530761719, -14.777312278747559, -13.958868980407715, -13.140425682067871, -12.321981430053711, -11.50353717803955, -10.685093879699707, -9.866650581359863, -9.048206329345703, -8.22976303100586, -7.411319732666016, -6.592876434326172, -5.77443265914917, -4.955989360809326, -4.137546062469482, -3.3191022872924805, -2.5006589889526367, -1.6822154521942139, -0.863771915435791, -0.045328617095947266, 0.7731151580810547, 1.5915584564208984, 2.4100019931793213, 3.228445529937744, 4.046888828277588, 4.86533260345459, 5.683775901794434, 6.502219200134277, 7.320662975311279, 8.139106750488281, 8.957550048828125, 9.775993347167969, 10.594436645507812, 11.412880897521973, 12.231324195861816, 13.04976749420166, 13.86821174621582, 14.686654090881348]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 6.0, 8.0, 8.0, 9.0, 6.0, 11.0, 16.0, 20.0, 20.0, 13.0, 22.0, 22.0, 34.0, 40.0, 39.0, 29.0, 48.0, 29.0, 40.0, 41.0, 42.0, 52.0, 45.0, 50.0, 37.0, 38.0, 34.0, 35.0, 39.0, 22.0, 24.0, 21.0, 18.0, 14.0, 13.0, 8.0, 15.0, 11.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.780960083007812, -12.321908950805664, -11.8628568649292, -11.40380573272705, -10.944753646850586, -10.485702514648438, -10.026651382446289, -9.567599296569824, -9.10854721069336, -8.649496078491211, -8.190443992614746, -7.731392860412598, -7.272340774536133, -6.813289642333984, -6.354238033294678, -5.895186424255371, -5.436135292053223, -4.977083683013916, -4.518032073974609, -4.058980941772461, -3.599929094314575, -3.1408774852752686, -2.681826114654541, -2.2227745056152344, -1.7637228965759277, -1.304671287536621, -0.845619797706604, -0.3865683078765869, 0.07248330116271973, 0.5315349102020264, 0.9905862808227539, 1.4496378898620605, 1.9086894989013672, 2.367741107940674, 2.8267927169799805, 3.285844087600708, 3.7448956966400146, 4.203947067260742, 4.662998676300049, 5.1220502853393555, 5.581101894378662, 6.040153503417969, 6.499205112457275, 6.958256721496582, 7.4173078536987305, 7.876359939575195, 8.335411071777344, 8.794462203979492, 9.253514289855957, 9.712565422058105, 10.17161750793457, 10.630668640136719, 11.089720726013184, 11.548771858215332, 12.007823944091797, 12.466875076293945, 12.925926208496094, 13.384977340698242, 13.844029426574707, 14.303080558776855, 14.76213264465332, 15.221183776855469, 15.680234909057617, 16.139286041259766, 16.598339080810547]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 1.0, 10.0, 6.0, 13.0, 9.0, 16.0, 12.0, 13.0, 15.0, 31.0, 25.0, 21.0, 26.0, 37.0, 35.0, 37.0, 43.0, 46.0, 28.0, 52.0, 45.0, 41.0, 48.0, 39.0, 37.0, 44.0, 33.0, 30.0, 35.0, 27.0, 20.0, 22.0, 19.0, 16.0, 14.0, 8.0, 7.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5255889892578125, -1.479888916015625, -1.4341888427734375, -1.38848876953125, -1.3427886962890625, -1.297088623046875, -1.2513885498046875, -1.2056884765625, -1.1599884033203125, -1.114288330078125, -1.0685882568359375, -1.02288818359375, -0.9771881103515625, -0.931488037109375, -0.8857879638671875, -0.840087890625, -0.7943878173828125, -0.748687744140625, -0.7029876708984375, -0.65728759765625, -0.6115875244140625, -0.565887451171875, -0.5201873779296875, -0.4744873046875, -0.4287872314453125, -0.383087158203125, -0.3373870849609375, -0.29168701171875, -0.2459869384765625, -0.200286865234375, -0.1545867919921875, -0.10888671875, -0.0631866455078125, -0.017486572265625, 0.0282135009765625, 0.07391357421875, 0.1196136474609375, 0.165313720703125, 0.2110137939453125, 0.2567138671875, 0.3024139404296875, 0.348114013671875, 0.3938140869140625, 0.43951416015625, 0.4852142333984375, 0.530914306640625, 0.5766143798828125, 0.622314453125, 0.6680145263671875, 0.713714599609375, 0.7594146728515625, 0.80511474609375, 0.8508148193359375, 0.896514892578125, 0.9422149658203125, 0.9879150390625, 1.0336151123046875, 1.079315185546875, 1.1250152587890625, 1.17071533203125, 1.2164154052734375, 1.262115478515625, 1.3078155517578125, 1.353515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 7.0, 19.0, 17.0, 28.0, 43.0, 69.0, 92.0, 163.0, 239.0, 372.0, 528.0, 827.0, 1158.0, 1796.0, 2686.0, 4127.0, 6341.0, 9832.0, 15289.0, 24334.0, 39818.0, 68350.0, 134376.0, 311537.0, 200655.0, 91117.0, 50681.0, 30392.0, 18971.0, 12096.0, 7802.0, 4993.0, 3337.0, 2127.0, 1415.0, 980.0, 673.0, 461.0, 263.0, 184.0, 137.0, 78.0, 54.0, 36.0, 20.0, 15.0, 5.0, 8.0, 3.0, 2.0, 6.0, 1.0, 2.0], "bins": [-0.301025390625, -0.2923583984375, -0.28369140625, -0.2750244140625, -0.266357421875, -0.2576904296875, -0.2490234375, -0.2403564453125, -0.231689453125, -0.2230224609375, -0.21435546875, -0.2056884765625, -0.197021484375, -0.1883544921875, -0.1796875, -0.1710205078125, -0.162353515625, -0.1536865234375, -0.14501953125, -0.1363525390625, -0.127685546875, -0.1190185546875, -0.1103515625, -0.1016845703125, -0.093017578125, -0.0843505859375, -0.07568359375, -0.0670166015625, -0.058349609375, -0.0496826171875, -0.041015625, -0.0323486328125, -0.023681640625, -0.0150146484375, -0.00634765625, 0.0023193359375, 0.010986328125, 0.0196533203125, 0.0283203125, 0.0369873046875, 0.045654296875, 0.0543212890625, 0.06298828125, 0.0716552734375, 0.080322265625, 0.0889892578125, 0.09765625, 0.1063232421875, 0.114990234375, 0.1236572265625, 0.13232421875, 0.1409912109375, 0.149658203125, 0.1583251953125, 0.1669921875, 0.1756591796875, 0.184326171875, 0.1929931640625, 0.20166015625, 0.2103271484375, 0.218994140625, 0.2276611328125, 0.236328125, 0.2449951171875, 0.253662109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 13.0, 7.0, 9.0, 12.0, 14.0, 17.0, 14.0, 27.0, 27.0, 18.0, 29.0, 31.0, 33.0, 42.0, 29.0, 45.0, 35.0, 47.0, 1056.0, 47.0, 43.0, 45.0, 29.0, 43.0, 31.0, 47.0, 23.0, 30.0, 35.0, 24.0, 33.0, 17.0, 8.0, 16.0, 15.0, 3.0, 14.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.88671875, -0.8589859008789062, -0.8312530517578125, -0.8035202026367188, -0.775787353515625, -0.7480545043945312, -0.7203216552734375, -0.6925888061523438, -0.66485595703125, -0.6371231079101562, -0.6093902587890625, -0.5816574096679688, -0.553924560546875, -0.5261917114257812, -0.4984588623046875, -0.47072601318359375, -0.4429931640625, -0.41526031494140625, -0.3875274658203125, -0.35979461669921875, -0.332061767578125, -0.30432891845703125, -0.2765960693359375, -0.24886322021484375, -0.22113037109375, -0.19339752197265625, -0.1656646728515625, -0.13793182373046875, -0.110198974609375, -0.08246612548828125, -0.0547332763671875, -0.02700042724609375, 0.000732421875, 0.02846527099609375, 0.0561981201171875, 0.08393096923828125, 0.111663818359375, 0.13939666748046875, 0.1671295166015625, 0.19486236572265625, 0.22259521484375, 0.25032806396484375, 0.2780609130859375, 0.30579376220703125, 0.333526611328125, 0.36125946044921875, 0.3889923095703125, 0.41672515869140625, 0.4444580078125, 0.47219085693359375, 0.4999237060546875, 0.5276565551757812, 0.555389404296875, 0.5831222534179688, 0.6108551025390625, 0.6385879516601562, 0.66632080078125, 0.6940536499023438, 0.7217864990234375, 0.7495193481445312, 0.777252197265625, 0.8049850463867188, 0.8327178955078125, 0.8604507446289062, 0.88818359375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 14.0, 21.0, 25.0, 38.0, 62.0, 78.0, 121.0, 186.0, 257.0, 402.0, 610.0, 901.0, 1438.0, 2098.0, 3247.0, 5145.0, 7987.0, 12615.0, 19977.0, 33368.0, 55336.0, 99462.0, 209679.0, 1333621.0, 132897.0, 69595.0, 40969.0, 24646.0, 15078.0, 9653.0, 6208.0, 3974.0, 2524.0, 1687.0, 1079.0, 693.0, 445.0, 313.0, 206.0, 144.0, 100.0, 65.0, 48.0, 40.0, 29.0, 18.0, 9.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2445068359375, -0.23691558837890625, -0.2293243408203125, -0.22173309326171875, -0.214141845703125, -0.20655059814453125, -0.1989593505859375, -0.19136810302734375, -0.18377685546875, -0.17618560791015625, -0.1685943603515625, -0.16100311279296875, -0.153411865234375, -0.14582061767578125, -0.1382293701171875, -0.13063812255859375, -0.123046875, -0.11545562744140625, -0.1078643798828125, -0.10027313232421875, -0.092681884765625, -0.08509063720703125, -0.0774993896484375, -0.06990814208984375, -0.06231689453125, -0.05472564697265625, -0.0471343994140625, -0.03954315185546875, -0.031951904296875, -0.02436065673828125, -0.0167694091796875, -0.00917816162109375, -0.0015869140625, 0.00600433349609375, 0.0135955810546875, 0.02118682861328125, 0.028778076171875, 0.03636932373046875, 0.0439605712890625, 0.05155181884765625, 0.05914306640625, 0.06673431396484375, 0.0743255615234375, 0.08191680908203125, 0.089508056640625, 0.09709930419921875, 0.1046905517578125, 0.11228179931640625, 0.119873046875, 0.12746429443359375, 0.1350555419921875, 0.14264678955078125, 0.150238037109375, 0.15782928466796875, 0.1654205322265625, 0.17301177978515625, 0.18060302734375, 0.18819427490234375, 0.1957855224609375, 0.20337677001953125, 0.210968017578125, 0.21855926513671875, 0.2261505126953125, 0.23374176025390625, 0.2413330078125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 6.0, 6.0, 4.0, 5.0, 8.0, 12.0, 11.0, 8.0, 21.0, 25.0, 19.0, 30.0, 26.0, 40.0, 43.0, 47.0, 46.0, 44.0, 46.0, 55.0, 55.0, 51.0, 55.0, 40.0, 43.0, 38.0, 40.0, 31.0, 22.0, 18.0, 20.0, 15.0, 19.0, 12.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0001678466796875, -0.00016313977539539337, -0.00015843287110328674, -0.00015372596681118011, -0.00014901906251907349, -0.00014431215822696686, -0.00013960525393486023, -0.0001348983496427536, -0.00013019144535064697, -0.00012548454105854034, -0.00012077763676643372, -0.00011607073247432709, -0.00011136382818222046, -0.00010665692389011383, -0.0001019500195980072, -9.724311530590057e-05, -9.253621101379395e-05, -8.782930672168732e-05, -8.312240242958069e-05, -7.841549813747406e-05, -7.370859384536743e-05, -6.90016895532608e-05, -6.429478526115417e-05, -5.9587880969047546e-05, -5.488097667694092e-05, -5.017407238483429e-05, -4.546716809272766e-05, -4.076026380062103e-05, -3.6053359508514404e-05, -3.1346455216407776e-05, -2.6639550924301147e-05, -2.193264663219452e-05, -1.722574234008789e-05, -1.2518838047981262e-05, -7.811933755874634e-06, -3.1050294637680054e-06, 1.601874828338623e-06, 6.3087791204452515e-06, 1.101568341255188e-05, 1.5722587704658508e-05, 2.0429491996765137e-05, 2.5136396288871765e-05, 2.9843300580978394e-05, 3.455020487308502e-05, 3.925710916519165e-05, 4.396401345729828e-05, 4.867091774940491e-05, 5.3377822041511536e-05, 5.8084726333618164e-05, 6.279163062572479e-05, 6.749853491783142e-05, 7.220543920993805e-05, 7.691234350204468e-05, 8.16192477941513e-05, 8.632615208625793e-05, 9.103305637836456e-05, 9.573996067047119e-05, 0.00010044686496257782, 0.00010515376925468445, 0.00010986067354679108, 0.0001145675778388977, 0.00011927448213100433, 0.00012398138642311096, 0.0001286882907152176, 0.00013339519500732422]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 12.0, 10.0, 17.0, 12.0, 20.0, 35.0, 27.0, 54.0, 64.0, 79.0, 101.0, 124.0, 161.0, 206.0, 323.0, 548.0, 2892.0, 980844.0, 60567.0, 947.0, 408.0, 295.0, 195.0, 153.0, 93.0, 95.0, 54.0, 53.0, 34.0, 25.0, 40.0, 13.0, 18.0, 6.0, 5.0, 4.0, 2.0, 0.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025768280029296875, -0.0024839043617248535, -0.0023909807205200195, -0.0022980570793151855, -0.0022051334381103516, -0.0021122097969055176, -0.0020192861557006836, -0.0019263625144958496, -0.0018334388732910156, -0.0017405152320861816, -0.0016475915908813477, -0.0015546679496765137, -0.0014617443084716797, -0.0013688206672668457, -0.0012758970260620117, -0.0011829733848571777, -0.0010900497436523438, -0.0009971261024475098, -0.0009042024612426758, -0.0008112788200378418, -0.0007183551788330078, -0.0006254315376281738, -0.0005325078964233398, -0.00043958425521850586, -0.0003466606140136719, -0.0002537369728088379, -0.0001608133316040039, -6.788969039916992e-05, 2.5033950805664062e-05, 0.00011795759201049805, 0.00021088123321533203, 0.000303804874420166, 0.000396728515625, 0.000489652156829834, 0.000582575798034668, 0.000675499439239502, 0.0007684230804443359, 0.0008613467216491699, 0.0009542703628540039, 0.0010471940040588379, 0.0011401176452636719, 0.0012330412864685059, 0.0013259649276733398, 0.0014188885688781738, 0.0015118122100830078, 0.0016047358512878418, 0.0016976594924926758, 0.0017905831336975098, 0.0018835067749023438, 0.0019764304161071777, 0.0020693540573120117, 0.0021622776985168457, 0.0022552013397216797, 0.0023481249809265137, 0.0024410486221313477, 0.0025339722633361816, 0.0026268959045410156, 0.0027198195457458496, 0.0028127431869506836, 0.0029056668281555176, 0.0029985904693603516, 0.0030915141105651855, 0.0031844377517700195, 0.0032773613929748535, 0.0033702850341796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 45.0, 175.0, 337.0, 286.0, 121.0, 39.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024024049344006926, -0.00023130580666474998, -0.00022237110533751547, -0.0002134364185621962, -0.00020450173178687692, -0.0001955670304596424, -0.00018663234368432313, -0.00017769765690900385, -0.00016876295558176935, -0.00015982826880645007, -0.00015089356747921556, -0.00014195888070389628, -0.000133024193928577, -0.00012408950715325773, -0.00011515480582602322, -0.00010622011905070394, -9.728543227538466e-05, -8.835073822410777e-05, -7.94160514487885e-05, -7.04813573975116e-05, -6.154667062219232e-05, -5.261197657091543e-05, -4.367728251963854e-05, -3.474259574431926e-05, -2.5807901693042368e-05, -1.6873211279744282e-05, -7.938519047456793e-06, 9.961731848306954e-07, 9.93086359812878e-06, 1.8865554011426866e-05, 2.780024806270376e-05, 3.673493483802304e-05, 4.566964344121516e-05, 5.460433385451324e-05, 6.353902426781133e-05, 7.247371831908822e-05, 8.14084050944075e-05, 9.034309914568439e-05, 9.927779319696128e-05, 0.00010821247997228056, 0.00011714717402355745, 0.00012608186807483435, 0.00013501655485015363, 0.0001439512416254729, 0.0001528859429527074, 0.0001618206297280267, 0.00017075531650334597, 0.00017969001783058047, 0.00018862470460589975, 0.00019755939138121903, 0.00020649409270845354, 0.00021542877948377281, 0.0002243634662590921, 0.0002332981675863266, 0.00024223285436164588, 0.00025116754113696516, 0.00026010224246419966, 0.00026903694379143417, 0.0002779716160148382, 0.0002869063173420727, 0.00029584101866930723, 0.0003047756908927113, 0.0003137103922199458, 0.00032264506444334984, 0.00033157976577058434]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 7.0, 8.0, 11.0, 13.0, 26.0, 17.0, 25.0, 26.0, 22.0, 25.0, 28.0, 35.0, 35.0, 33.0, 24.0, 48.0, 43.0, 42.0, 41.0, 54.0, 30.0, 45.0, 41.0, 28.0, 30.0, 32.0, 16.0, 39.0, 21.0, 29.0, 21.0, 18.0, 16.0, 15.0, 10.0, 13.0, 5.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.417533874511719e-05, -9.147822856903076e-05, -8.878111839294434e-05, -8.608400821685791e-05, -8.338689804077148e-05, -8.068978786468506e-05, -7.799267768859863e-05, -7.529556751251221e-05, -7.259845733642578e-05, -6.990134716033936e-05, -6.720423698425293e-05, -6.45071268081665e-05, -6.181001663208008e-05, -5.911290645599365e-05, -5.6415796279907227e-05, -5.37186861038208e-05, -5.1021575927734375e-05, -4.832446575164795e-05, -4.5627355575561523e-05, -4.29302453994751e-05, -4.023313522338867e-05, -3.7536025047302246e-05, -3.483891487121582e-05, -3.2141804695129395e-05, -2.944469451904297e-05, -2.6747584342956543e-05, -2.4050474166870117e-05, -2.135336399078369e-05, -1.8656253814697266e-05, -1.595914363861084e-05, -1.3262033462524414e-05, -1.0564923286437988e-05, -7.867813110351562e-06, -5.170702934265137e-06, -2.473592758178711e-06, 2.2351741790771484e-07, 2.9206275939941406e-06, 5.617737770080566e-06, 8.314847946166992e-06, 1.1011958122253418e-05, 1.3709068298339844e-05, 1.640617847442627e-05, 1.9103288650512695e-05, 2.180039882659912e-05, 2.4497509002685547e-05, 2.7194619178771973e-05, 2.98917293548584e-05, 3.2588839530944824e-05, 3.528594970703125e-05, 3.7983059883117676e-05, 4.06801700592041e-05, 4.337728023529053e-05, 4.607439041137695e-05, 4.877150058746338e-05, 5.1468610763549805e-05, 5.416572093963623e-05, 5.6862831115722656e-05, 5.955994129180908e-05, 6.225705146789551e-05, 6.495416164398193e-05, 6.765127182006836e-05, 7.034838199615479e-05, 7.304549217224121e-05, 7.574260234832764e-05, 7.843971252441406e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 1.0, 10.0, 6.0, 13.0, 9.0, 16.0, 12.0, 13.0, 15.0, 31.0, 25.0, 21.0, 26.0, 37.0, 35.0, 37.0, 43.0, 46.0, 28.0, 52.0, 45.0, 41.0, 48.0, 39.0, 37.0, 44.0, 33.0, 30.0, 35.0, 27.0, 20.0, 22.0, 19.0, 16.0, 14.0, 8.0, 7.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5255889892578125, -1.479888916015625, -1.4341888427734375, -1.38848876953125, -1.3427886962890625, -1.297088623046875, -1.2513885498046875, -1.2056884765625, -1.1599884033203125, -1.114288330078125, -1.0685882568359375, -1.02288818359375, -0.9771881103515625, -0.931488037109375, -0.8857879638671875, -0.840087890625, -0.7943878173828125, -0.748687744140625, -0.7029876708984375, -0.65728759765625, -0.6115875244140625, -0.565887451171875, -0.5201873779296875, -0.4744873046875, -0.4287872314453125, -0.383087158203125, -0.3373870849609375, -0.29168701171875, -0.2459869384765625, -0.200286865234375, -0.1545867919921875, -0.10888671875, -0.0631866455078125, -0.017486572265625, 0.0282135009765625, 0.07391357421875, 0.1196136474609375, 0.165313720703125, 0.2110137939453125, 0.2567138671875, 0.3024139404296875, 0.348114013671875, 0.3938140869140625, 0.43951416015625, 0.4852142333984375, 0.530914306640625, 0.5766143798828125, 0.622314453125, 0.6680145263671875, 0.713714599609375, 0.7594146728515625, 0.80511474609375, 0.8508148193359375, 0.896514892578125, 0.9422149658203125, 0.9879150390625, 1.0336151123046875, 1.079315185546875, 1.1250152587890625, 1.17071533203125, 1.2164154052734375, 1.262115478515625, 1.3078155517578125, 1.353515625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 7.0, 8.0, 15.0, 15.0, 15.0, 36.0, 41.0, 56.0, 84.0, 93.0, 117.0, 144.0, 237.0, 312.0, 386.0, 677.0, 1065.0, 1561.0, 2738.0, 4788.0, 8808.0, 17480.0, 36762.0, 86699.0, 216883.0, 357714.0, 176669.0, 70469.0, 30908.0, 15003.0, 7761.0, 4166.0, 2349.0, 1490.0, 926.0, 592.0, 405.0, 283.0, 205.0, 151.0, 107.0, 86.0, 67.0, 45.0, 39.0, 26.0, 18.0, 16.0, 11.0, 8.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4716796875, -1.426239013671875, -1.38079833984375, -1.335357666015625, -1.2899169921875, -1.244476318359375, -1.19903564453125, -1.153594970703125, -1.108154296875, -1.062713623046875, -1.01727294921875, -0.971832275390625, -0.9263916015625, -0.880950927734375, -0.83551025390625, -0.790069580078125, -0.74462890625, -0.699188232421875, -0.65374755859375, -0.608306884765625, -0.5628662109375, -0.517425537109375, -0.47198486328125, -0.426544189453125, -0.381103515625, -0.335662841796875, -0.29022216796875, -0.244781494140625, -0.1993408203125, -0.153900146484375, -0.10845947265625, -0.063018798828125, -0.017578125, 0.027862548828125, 0.07330322265625, 0.118743896484375, 0.1641845703125, 0.209625244140625, 0.25506591796875, 0.300506591796875, 0.345947265625, 0.391387939453125, 0.43682861328125, 0.482269287109375, 0.5277099609375, 0.573150634765625, 0.61859130859375, 0.664031982421875, 0.70947265625, 0.754913330078125, 0.80035400390625, 0.845794677734375, 0.8912353515625, 0.936676025390625, 0.98211669921875, 1.027557373046875, 1.072998046875, 1.118438720703125, 1.16387939453125, 1.209320068359375, 1.2547607421875, 1.300201416015625, 1.34564208984375, 1.391082763671875, 1.4365234375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 7.0, 2.0, 12.0, 9.0, 12.0, 17.0, 13.0, 26.0, 19.0, 20.0, 35.0, 30.0, 32.0, 40.0, 40.0, 42.0, 60.0, 77.0, 220.0, 1505.0, 288.0, 102.0, 59.0, 59.0, 30.0, 28.0, 40.0, 29.0, 30.0, 25.0, 25.0, 19.0, 21.0, 12.0, 13.0, 7.0, 5.0, 8.0, 6.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76275634765625, -4.6075439453125, -4.45233154296875, -4.297119140625, -4.14190673828125, -3.9866943359375, -3.83148193359375, -3.67626953125, -3.52105712890625, -3.3658447265625, -3.21063232421875, -3.055419921875, -2.90020751953125, -2.7449951171875, -2.58978271484375, -2.4345703125, -2.27935791015625, -2.1241455078125, -1.96893310546875, -1.813720703125, -1.65850830078125, -1.5032958984375, -1.34808349609375, -1.19287109375, -1.03765869140625, -0.8824462890625, -0.72723388671875, -0.572021484375, -0.41680908203125, -0.2615966796875, -0.10638427734375, 0.048828125, 0.20404052734375, 0.3592529296875, 0.51446533203125, 0.669677734375, 0.82489013671875, 0.9801025390625, 1.13531494140625, 1.29052734375, 1.44573974609375, 1.6009521484375, 1.75616455078125, 1.911376953125, 2.06658935546875, 2.2218017578125, 2.37701416015625, 2.5322265625, 2.68743896484375, 2.8426513671875, 2.99786376953125, 3.153076171875, 3.30828857421875, 3.4635009765625, 3.61871337890625, 3.77392578125, 3.92913818359375, 4.0843505859375, 4.23956298828125, 4.394775390625, 4.54998779296875, 4.7052001953125, 4.86041259765625, 5.015625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 8.0, 9.0, 11.0, 9.0, 16.0, 23.0, 29.0, 30.0, 36.0, 51.0, 83.0, 98.0, 156.0, 293.0, 687.0, 2709.0, 42081.0, 2906076.0, 185113.0, 6097.0, 1011.0, 330.0, 198.0, 147.0, 97.0, 67.0, 47.0, 27.0, 37.0, 25.0, 23.0, 20.0, 8.0, 8.0, 5.0, 9.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.1640625, -9.879150390625, -9.59423828125, -9.309326171875, -9.0244140625, -8.739501953125, -8.45458984375, -8.169677734375, -7.884765625, -7.599853515625, -7.31494140625, -7.030029296875, -6.7451171875, -6.460205078125, -6.17529296875, -5.890380859375, -5.60546875, -5.320556640625, -5.03564453125, -4.750732421875, -4.4658203125, -4.180908203125, -3.89599609375, -3.611083984375, -3.326171875, -3.041259765625, -2.75634765625, -2.471435546875, -2.1865234375, -1.901611328125, -1.61669921875, -1.331787109375, -1.046875, -0.761962890625, -0.47705078125, -0.192138671875, 0.0927734375, 0.377685546875, 0.66259765625, 0.947509765625, 1.232421875, 1.517333984375, 1.80224609375, 2.087158203125, 2.3720703125, 2.656982421875, 2.94189453125, 3.226806640625, 3.51171875, 3.796630859375, 4.08154296875, 4.366455078125, 4.6513671875, 4.936279296875, 5.22119140625, 5.506103515625, 5.791015625, 6.075927734375, 6.36083984375, 6.645751953125, 6.9306640625, 7.215576171875, 7.50048828125, 7.785400390625, 8.0703125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 20.0, 135.0, 366.0, 348.0, 122.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.35190200805664, -14.58341121673584, -13.814920425415039, -13.046428680419922, -12.277938842773438, -11.50944709777832, -10.74095630645752, -9.972465515136719, -9.203974723815918, -8.435483932495117, -7.666993141174316, -6.898501873016357, -6.130011081695557, -5.361520290374756, -4.593029022216797, -3.824538230895996, -3.0560474395751953, -2.2875566482543945, -1.5190656185150146, -0.7505745887756348, 0.017916202545166016, 0.7864069938659668, 1.5548982620239258, 2.3233890533447266, 3.0918798446655273, 3.860370635986328, 4.628861427307129, 5.397352695465088, 6.165843486785889, 6.9343342781066895, 7.702825546264648, 8.47131633758545, 9.23980712890625, 10.00829792022705, 10.776788711547852, 11.545280456542969, 12.313770294189453, 13.08226203918457, 13.850752830505371, 14.619243621826172, 15.387734413146973, 16.156225204467773, 16.92471694946289, 17.693206787109375, 18.461698532104492, 19.230188369750977, 19.998680114746094, 20.767169952392578, 21.535661697387695, 22.304153442382812, 23.072643280029297, 23.841135025024414, 24.6096248626709, 25.378116607666016, 26.1466064453125, 26.915098190307617, 27.683589935302734, 28.45208168029785, 29.220571517944336, 29.989063262939453, 30.757553100585938, 31.526044845581055, 32.29453659057617, 33.063026428222656, 33.83151626586914]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 7.0, 18.0, 20.0, 15.0, 21.0, 23.0, 32.0, 18.0, 33.0, 38.0, 26.0, 46.0, 41.0, 35.0, 44.0, 34.0, 49.0, 57.0, 42.0, 30.0, 29.0, 33.0, 29.0, 37.0, 37.0, 31.0, 20.0, 19.0, 22.0, 14.0, 11.0, 9.0, 12.0, 11.0, 6.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.569936752319336, -17.070125579833984, -16.5703125, -16.07050132751465, -15.57068920135498, -15.070877075195312, -14.571064949035645, -14.071252822875977, -13.571441650390625, -13.071629524230957, -12.571817398071289, -12.072006225585938, -11.57219409942627, -11.072381973266602, -10.572569847106934, -10.072757720947266, -9.572946548461914, -9.073134422302246, -8.573322296142578, -8.073511123657227, -7.573698997497559, -7.073886871337891, -6.574074745178223, -6.074263095855713, -5.574450492858887, -5.074638366699219, -4.574826717376709, -4.075014591217041, -3.5752029418945312, -3.0753908157348633, -2.5755789279937744, -2.0757670402526855, -1.5759553909301758, -1.076143503189087, -0.5763315558433533, -0.07651960849761963, 0.42329227924346924, 0.9231042861938477, 1.4229161739349365, 1.9227280616760254, 2.4225399494171143, 2.922351837158203, 3.422163724899292, 3.921975612640381, 4.421787738800049, 4.921599388122559, 5.421411514282227, 5.9212236404418945, 6.421035289764404, 6.920847415924072, 7.420659065246582, 7.92047119140625, 8.420283317565918, 8.920095443725586, 9.419906616210938, 9.919718742370605, 10.419530868530273, 10.919342994689941, 11.41915512084961, 11.918966293334961, 12.418778419494629, 12.918590545654297, 13.418402671813965, 13.918214797973633, 14.418025970458984]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 11.0, 12.0, 15.0, 8.0, 15.0, 17.0, 16.0, 19.0, 20.0, 19.0, 27.0, 29.0, 39.0, 35.0, 35.0, 39.0, 34.0, 41.0, 48.0, 51.0, 35.0, 41.0, 35.0, 44.0, 36.0, 32.0, 36.0, 31.0, 20.0, 29.0, 24.0, 11.0, 19.0, 19.0, 5.0, 8.0, 9.0, 7.0, 5.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6611328125, -1.6137237548828125, -1.566314697265625, -1.5189056396484375, -1.47149658203125, -1.4240875244140625, -1.376678466796875, -1.3292694091796875, -1.2818603515625, -1.2344512939453125, -1.187042236328125, -1.1396331787109375, -1.09222412109375, -1.0448150634765625, -0.997406005859375, -0.9499969482421875, -0.902587890625, -0.8551788330078125, -0.807769775390625, -0.7603607177734375, -0.71295166015625, -0.6655426025390625, -0.618133544921875, -0.5707244873046875, -0.5233154296875, -0.4759063720703125, -0.428497314453125, -0.3810882568359375, -0.33367919921875, -0.2862701416015625, -0.238861083984375, -0.1914520263671875, -0.14404296875, -0.0966339111328125, -0.049224853515625, -0.0018157958984375, 0.04559326171875, 0.0930023193359375, 0.140411376953125, 0.1878204345703125, 0.2352294921875, 0.2826385498046875, 0.330047607421875, 0.3774566650390625, 0.42486572265625, 0.4722747802734375, 0.519683837890625, 0.5670928955078125, 0.614501953125, 0.6619110107421875, 0.709320068359375, 0.7567291259765625, 0.80413818359375, 0.8515472412109375, 0.898956298828125, 0.9463653564453125, 0.9937744140625, 1.0411834716796875, 1.088592529296875, 1.1360015869140625, 1.18341064453125, 1.2308197021484375, 1.278228759765625, 1.3256378173828125, 1.373046875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 8.0, 12.0, 19.0, 13.0, 14.0, 16.0, 11.0, 13.0, 27.0, 20.0, 35.0, 49.0, 69.0, 136.0, 369.0, 1585.0, 11554.0, 330566.0, 3574222.0, 262910.0, 10400.0, 1398.0, 357.0, 125.0, 50.0, 32.0, 37.0, 37.0, 28.0, 18.0, 27.0, 15.0, 15.0, 14.0, 14.0, 10.0, 5.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-7.87109375, -7.64276123046875, -7.4144287109375, -7.18609619140625, -6.957763671875, -6.72943115234375, -6.5010986328125, -6.27276611328125, -6.04443359375, -5.81610107421875, -5.5877685546875, -5.35943603515625, -5.131103515625, -4.90277099609375, -4.6744384765625, -4.44610595703125, -4.2177734375, -3.98944091796875, -3.7611083984375, -3.53277587890625, -3.304443359375, -3.07611083984375, -2.8477783203125, -2.61944580078125, -2.39111328125, -2.16278076171875, -1.9344482421875, -1.70611572265625, -1.477783203125, -1.24945068359375, -1.0211181640625, -0.79278564453125, -0.564453125, -0.33612060546875, -0.1077880859375, 0.12054443359375, 0.348876953125, 0.57720947265625, 0.8055419921875, 1.03387451171875, 1.26220703125, 1.49053955078125, 1.7188720703125, 1.94720458984375, 2.175537109375, 2.40386962890625, 2.6322021484375, 2.86053466796875, 3.0888671875, 3.31719970703125, 3.5455322265625, 3.77386474609375, 4.002197265625, 4.23052978515625, 4.4588623046875, 4.68719482421875, 4.91552734375, 5.14385986328125, 5.3721923828125, 5.60052490234375, 5.828857421875, 6.05718994140625, 6.2855224609375, 6.51385498046875, 6.7421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 6.0, 15.0, 16.0, 30.0, 28.0, 45.0, 57.0, 82.0, 123.0, 174.0, 239.0, 286.0, 395.0, 487.0, 452.0, 392.0, 329.0, 262.0, 168.0, 132.0, 89.0, 63.0, 45.0, 36.0, 19.0, 27.0, 25.0, 10.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.138763427734375, -5.00018310546875, -4.861602783203125, -4.7230224609375, -4.584442138671875, -4.44586181640625, -4.307281494140625, -4.168701171875, -4.030120849609375, -3.89154052734375, -3.752960205078125, -3.6143798828125, -3.475799560546875, -3.33721923828125, -3.198638916015625, -3.06005859375, -2.921478271484375, -2.78289794921875, -2.644317626953125, -2.5057373046875, -2.367156982421875, -2.22857666015625, -2.089996337890625, -1.951416015625, -1.812835693359375, -1.67425537109375, -1.535675048828125, -1.3970947265625, -1.258514404296875, -1.11993408203125, -0.981353759765625, -0.8427734375, -0.704193115234375, -0.56561279296875, -0.427032470703125, -0.2884521484375, -0.149871826171875, -0.01129150390625, 0.127288818359375, 0.265869140625, 0.404449462890625, 0.54302978515625, 0.681610107421875, 0.8201904296875, 0.958770751953125, 1.09735107421875, 1.235931396484375, 1.37451171875, 1.513092041015625, 1.65167236328125, 1.790252685546875, 1.9288330078125, 2.067413330078125, 2.20599365234375, 2.344573974609375, 2.483154296875, 2.621734619140625, 2.76031494140625, 2.898895263671875, 3.0374755859375, 3.176055908203125, 3.31463623046875, 3.453216552734375, 3.591796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 18.0, 30.0, 30.0, 49.0, 42.0, 87.0, 125.0, 175.0, 289.0, 689.0, 2296.0, 16871.0, 521574.0, 3496196.0, 145684.0, 7594.0, 1375.0, 439.0, 243.0, 136.0, 91.0, 59.0, 43.0, 32.0, 26.0, 13.0, 12.0, 5.0, 10.0, 7.0, 4.0, 6.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.166259765625, -10.78564453125, -10.405029296875, -10.0244140625, -9.643798828125, -9.26318359375, -8.882568359375, -8.501953125, -8.121337890625, -7.74072265625, -7.360107421875, -6.9794921875, -6.598876953125, -6.21826171875, -5.837646484375, -5.45703125, -5.076416015625, -4.69580078125, -4.315185546875, -3.9345703125, -3.553955078125, -3.17333984375, -2.792724609375, -2.412109375, -2.031494140625, -1.65087890625, -1.270263671875, -0.8896484375, -0.509033203125, -0.12841796875, 0.252197265625, 0.6328125, 1.013427734375, 1.39404296875, 1.774658203125, 2.1552734375, 2.535888671875, 2.91650390625, 3.297119140625, 3.677734375, 4.058349609375, 4.43896484375, 4.819580078125, 5.2001953125, 5.580810546875, 5.96142578125, 6.342041015625, 6.72265625, 7.103271484375, 7.48388671875, 7.864501953125, 8.2451171875, 8.625732421875, 9.00634765625, 9.386962890625, 9.767578125, 10.148193359375, 10.52880859375, 10.909423828125, 11.2900390625, 11.670654296875, 12.05126953125, 12.431884765625, 12.8125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 14.0, 35.0, 38.0, 64.0, 90.0, 103.0, 111.0, 114.0, 101.0, 113.0, 81.0, 56.0, 31.0, 15.0, 18.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.88625717163086, -26.293231964111328, -25.700204849243164, -25.107179641723633, -24.51415252685547, -23.921127319335938, -23.328102111816406, -22.735076904296875, -22.14204978942871, -21.54902458190918, -20.955997467041016, -20.362972259521484, -19.769947052001953, -19.17691993713379, -18.583894729614258, -17.990867614746094, -17.397842407226562, -16.80481719970703, -16.211790084838867, -15.618764877319336, -15.025738716125488, -14.43271255493164, -13.83968734741211, -13.246661186218262, -12.653635025024414, -12.060608863830566, -11.467582702636719, -10.874557495117188, -10.28153133392334, -9.688505172729492, -9.095479965209961, -8.502453804016113, -7.909427642822266, -7.316401481628418, -6.7233757972717285, -6.130350112915039, -5.537323951721191, -4.944297790527344, -4.351272106170654, -3.758246421813965, -3.165220260620117, -2.5721943378448486, -1.97916841506958, -1.3861424922943115, -0.793116569519043, -0.20009064674377441, 0.39293527603149414, 0.9859609603881836, 1.5789871215820312, 2.1720130443573, 2.7650389671325684, 3.358064889907837, 3.9510908126831055, 4.544116973876953, 5.137142658233643, 5.730168342590332, 6.32319450378418, 6.916220664978027, 7.509246349334717, 8.102272033691406, 8.695298194885254, 9.288324356079102, 9.881349563598633, 10.47437572479248, 11.067401885986328]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 8.0, 7.0, 9.0, 15.0, 16.0, 15.0, 17.0, 13.0, 23.0, 29.0, 24.0, 13.0, 34.0, 33.0, 36.0, 34.0, 40.0, 38.0, 43.0, 40.0, 44.0, 40.0, 39.0, 38.0, 36.0, 36.0, 33.0, 34.0, 23.0, 24.0, 23.0, 25.0, 13.0, 12.0, 20.0, 10.0, 8.0, 14.0, 9.0, 10.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.997387886047363, -13.576021194458008, -13.154654502868652, -12.733287811279297, -12.311921119689941, -11.890554428100586, -11.46918773651123, -11.047821044921875, -10.62645435333252, -10.205087661743164, -9.783720970153809, -9.362354278564453, -8.940987586975098, -8.519620895385742, -8.098254203796387, -7.676887512207031, -7.255520820617676, -6.83415412902832, -6.412787437438965, -5.991420745849609, -5.570054054260254, -5.148687362670898, -4.727320671081543, -4.3059539794921875, -3.884587287902832, -3.4632205963134766, -3.041853904724121, -2.6204872131347656, -2.19912052154541, -1.7777538299560547, -1.3563871383666992, -0.9350204467773438, -0.5136528015136719, -0.0922861099243164, 0.32908058166503906, 0.7504472732543945, 1.17181396484375, 1.5931806564331055, 2.014547348022461, 2.4359140396118164, 2.857280731201172, 3.2786474227905273, 3.700014114379883, 4.121380805969238, 4.542747497558594, 4.964114189147949, 5.385480880737305, 5.80684757232666, 6.228214263916016, 6.649580955505371, 7.070947647094727, 7.492314338684082, 7.9136810302734375, 8.335047721862793, 8.756414413452148, 9.177781105041504, 9.59914779663086, 10.020514488220215, 10.44188117980957, 10.863247871398926, 11.284614562988281, 11.705981254577637, 12.127347946166992, 12.548714637756348, 12.970081329345703]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 12.0, 11.0, 12.0, 14.0, 21.0, 19.0, 22.0, 23.0, 24.0, 29.0, 37.0, 44.0, 42.0, 41.0, 56.0, 50.0, 41.0, 36.0, 36.0, 37.0, 36.0, 32.0, 30.0, 31.0, 36.0, 26.0, 19.0, 24.0, 16.0, 22.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.48046875, -1.432861328125, -1.38525390625, -1.337646484375, -1.2900390625, -1.242431640625, -1.19482421875, -1.147216796875, -1.099609375, -1.052001953125, -1.00439453125, -0.956787109375, -0.9091796875, -0.861572265625, -0.81396484375, -0.766357421875, -0.71875, -0.671142578125, -0.62353515625, -0.575927734375, -0.5283203125, -0.480712890625, -0.43310546875, -0.385498046875, -0.337890625, -0.290283203125, -0.24267578125, -0.195068359375, -0.1474609375, -0.099853515625, -0.05224609375, -0.004638671875, 0.04296875, 0.090576171875, 0.13818359375, 0.185791015625, 0.2333984375, 0.281005859375, 0.32861328125, 0.376220703125, 0.423828125, 0.471435546875, 0.51904296875, 0.566650390625, 0.6142578125, 0.661865234375, 0.70947265625, 0.757080078125, 0.8046875, 0.852294921875, 0.89990234375, 0.947509765625, 0.9951171875, 1.042724609375, 1.09033203125, 1.137939453125, 1.185546875, 1.233154296875, 1.28076171875, 1.328369140625, 1.3759765625, 1.423583984375, 1.47119140625, 1.518798828125, 1.56640625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 4.0, 2.0, 1.0, 7.0, 12.0, 24.0, 36.0, 53.0, 53.0, 81.0, 104.0, 204.0, 262.0, 357.0, 471.0, 791.0, 1041.0, 1410.0, 2155.0, 2995.0, 4470.0, 6467.0, 9337.0, 13712.0, 19804.0, 30293.0, 47804.0, 79826.0, 151319.0, 284248.0, 160944.0, 82863.0, 49716.0, 31570.0, 21018.0, 14095.0, 9522.0, 6596.0, 4553.0, 3095.0, 2191.0, 1494.0, 1028.0, 774.0, 527.0, 354.0, 263.0, 202.0, 135.0, 86.0, 46.0, 51.0, 37.0, 24.0, 12.0, 7.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.251220703125, -0.243255615234375, -0.23529052734375, -0.227325439453125, -0.2193603515625, -0.211395263671875, -0.20343017578125, -0.195465087890625, -0.1875, -0.179534912109375, -0.17156982421875, -0.163604736328125, -0.1556396484375, -0.147674560546875, -0.13970947265625, -0.131744384765625, -0.123779296875, -0.115814208984375, -0.10784912109375, -0.099884033203125, -0.0919189453125, -0.083953857421875, -0.07598876953125, -0.068023681640625, -0.06005859375, -0.052093505859375, -0.04412841796875, -0.036163330078125, -0.0281982421875, -0.020233154296875, -0.01226806640625, -0.004302978515625, 0.003662109375, 0.011627197265625, 0.01959228515625, 0.027557373046875, 0.0355224609375, 0.043487548828125, 0.05145263671875, 0.059417724609375, 0.0673828125, 0.075347900390625, 0.08331298828125, 0.091278076171875, 0.0992431640625, 0.107208251953125, 0.11517333984375, 0.123138427734375, 0.131103515625, 0.139068603515625, 0.14703369140625, 0.154998779296875, 0.1629638671875, 0.170928955078125, 0.17889404296875, 0.186859130859375, 0.19482421875, 0.202789306640625, 0.21075439453125, 0.218719482421875, 0.2266845703125, 0.234649658203125, 0.24261474609375, 0.250579833984375, 0.258544921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 8.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 11.0, 11.0, 13.0, 12.0, 10.0, 20.0, 36.0, 21.0, 28.0, 34.0, 31.0, 34.0, 41.0, 38.0, 35.0, 31.0, 40.0, 45.0, 1062.0, 30.0, 29.0, 36.0, 35.0, 26.0, 25.0, 30.0, 34.0, 27.0, 33.0, 20.0, 18.0, 16.0, 19.0, 13.0, 10.0, 5.0, 7.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8505859375, -0.821502685546875, -0.79241943359375, -0.763336181640625, -0.7342529296875, -0.705169677734375, -0.67608642578125, -0.647003173828125, -0.617919921875, -0.588836669921875, -0.55975341796875, -0.530670166015625, -0.5015869140625, -0.472503662109375, -0.44342041015625, -0.414337158203125, -0.38525390625, -0.356170654296875, -0.32708740234375, -0.298004150390625, -0.2689208984375, -0.239837646484375, -0.21075439453125, -0.181671142578125, -0.152587890625, -0.123504638671875, -0.09442138671875, -0.065338134765625, -0.0362548828125, -0.007171630859375, 0.02191162109375, 0.050994873046875, 0.080078125, 0.109161376953125, 0.13824462890625, 0.167327880859375, 0.1964111328125, 0.225494384765625, 0.25457763671875, 0.283660888671875, 0.312744140625, 0.341827392578125, 0.37091064453125, 0.399993896484375, 0.4290771484375, 0.458160400390625, 0.48724365234375, 0.516326904296875, 0.54541015625, 0.574493408203125, 0.60357666015625, 0.632659912109375, 0.6617431640625, 0.690826416015625, 0.71990966796875, 0.748992919921875, 0.778076171875, 0.807159423828125, 0.83624267578125, 0.865325927734375, 0.8944091796875, 0.923492431640625, 0.95257568359375, 0.981658935546875, 1.0107421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 9.0, 9.0, 13.0, 17.0, 31.0, 51.0, 81.0, 122.0, 211.0, 275.0, 388.0, 597.0, 874.0, 1207.0, 1760.0, 2634.0, 3800.0, 5842.0, 8817.0, 13471.0, 20994.0, 32780.0, 54578.0, 94291.0, 186839.0, 1331382.0, 136924.0, 75695.0, 44536.0, 27501.0, 17494.0, 11323.0, 7310.0, 4874.0, 3359.0, 2299.0, 1469.0, 1062.0, 763.0, 459.0, 345.0, 195.0, 164.0, 105.0, 59.0, 49.0, 31.0, 17.0, 14.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24951171875, -0.24127578735351562, -0.23303985595703125, -0.22480392456054688, -0.2165679931640625, -0.20833206176757812, -0.20009613037109375, -0.19186019897460938, -0.183624267578125, -0.17538833618164062, -0.16715240478515625, -0.15891647338867188, -0.1506805419921875, -0.14244461059570312, -0.13420867919921875, -0.12597274780273438, -0.11773681640625, -0.10950088500976562, -0.10126495361328125, -0.09302902221679688, -0.0847930908203125, -0.07655715942382812, -0.06832122802734375, -0.060085296630859375, -0.051849365234375, -0.043613433837890625, -0.03537750244140625, -0.027141571044921875, -0.0189056396484375, -0.010669708251953125, -0.00243377685546875, 0.005802154541015625, 0.0140380859375, 0.022274017333984375, 0.03050994873046875, 0.038745880126953125, 0.0469818115234375, 0.055217742919921875, 0.06345367431640625, 0.07168960571289062, 0.079925537109375, 0.08816146850585938, 0.09639739990234375, 0.10463333129882812, 0.1128692626953125, 0.12110519409179688, 0.12934112548828125, 0.13757705688476562, 0.14581298828125, 0.15404891967773438, 0.16228485107421875, 0.17052078247070312, 0.1787567138671875, 0.18699264526367188, 0.19522857666015625, 0.20346450805664062, 0.211700439453125, 0.21993637084960938, 0.22817230224609375, 0.23640823364257812, 0.2446441650390625, 0.2528800964355469, 0.26111602783203125, 0.2693519592285156, 0.277587890625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 7.0, 11.0, 11.0, 11.0, 10.0, 19.0, 14.0, 30.0, 31.0, 36.0, 53.0, 42.0, 37.0, 48.0, 63.0, 49.0, 46.0, 41.0, 39.0, 46.0, 49.0, 46.0, 37.0, 36.0, 29.0, 25.0, 18.0, 17.0, 18.0, 13.0, 12.0, 8.0, 9.0, 9.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.00016367435455322266, -0.00015834160149097443, -0.0001530088484287262, -0.00014767609536647797, -0.00014234334230422974, -0.0001370105892419815, -0.00013167783617973328, -0.00012634508311748505, -0.00012101233005523682, -0.00011567957699298859, -0.00011034682393074036, -0.00010501407086849213, -9.96813178062439e-05, -9.434856474399567e-05, -8.901581168174744e-05, -8.36830586194992e-05, -7.835030555725098e-05, -7.301755249500275e-05, -6.768479943275452e-05, -6.235204637050629e-05, -5.701929330825806e-05, -5.168654024600983e-05, -4.63537871837616e-05, -4.102103412151337e-05, -3.568828105926514e-05, -3.0355527997016907e-05, -2.5022774934768677e-05, -1.9690021872520447e-05, -1.4357268810272217e-05, -9.024515748023987e-06, -3.691762685775757e-06, 1.6409903764724731e-06, 6.973743438720703e-06, 1.2306496500968933e-05, 1.7639249563217163e-05, 2.2972002625465393e-05, 2.8304755687713623e-05, 3.363750874996185e-05, 3.897026181221008e-05, 4.430301487445831e-05, 4.963576793670654e-05, 5.496852099895477e-05, 6.0301274061203e-05, 6.563402712345123e-05, 7.096678018569946e-05, 7.629953324794769e-05, 8.163228631019592e-05, 8.696503937244415e-05, 9.229779243469238e-05, 9.763054549694061e-05, 0.00010296329855918884, 0.00010829605162143707, 0.0001136288046836853, 0.00011896155774593353, 0.00012429431080818176, 0.00012962706387043, 0.00013495981693267822, 0.00014029256999492645, 0.00014562532305717468, 0.0001509580761194229, 0.00015629082918167114, 0.00016162358224391937, 0.0001669563353061676, 0.00017228908836841583, 0.00017762184143066406]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 11.0, 9.0, 12.0, 23.0, 18.0, 25.0, 41.0, 45.0, 57.0, 71.0, 106.0, 109.0, 167.0, 275.0, 324.0, 613.0, 3339.0, 942681.0, 97947.0, 1150.0, 443.0, 254.0, 208.0, 116.0, 120.0, 93.0, 86.0, 54.0, 34.0, 31.0, 11.0, 13.0, 17.0, 10.0, 7.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0031909942626953125, -0.00308382511138916, -0.002976655960083008, -0.0028694868087768555, -0.002762317657470703, -0.0026551485061645508, -0.0025479793548583984, -0.002440810203552246, -0.0023336410522460938, -0.0022264719009399414, -0.002119302749633789, -0.0020121335983276367, -0.0019049644470214844, -0.001797795295715332, -0.0016906261444091797, -0.0015834569931030273, -0.001476287841796875, -0.0013691186904907227, -0.0012619495391845703, -0.001154780387878418, -0.0010476112365722656, -0.0009404420852661133, -0.0008332729339599609, -0.0007261037826538086, -0.0006189346313476562, -0.0005117654800415039, -0.00040459632873535156, -0.0002974271774291992, -0.00019025802612304688, -8.308887481689453e-05, 2.4080276489257812e-05, 0.00013124942779541016, 0.0002384185791015625, 0.00034558773040771484, 0.0004527568817138672, 0.0005599260330200195, 0.0006670951843261719, 0.0007742643356323242, 0.0008814334869384766, 0.000988602638244629, 0.0010957717895507812, 0.0012029409408569336, 0.001310110092163086, 0.0014172792434692383, 0.0015244483947753906, 0.001631617546081543, 0.0017387866973876953, 0.0018459558486938477, 0.001953125, 0.0020602941513061523, 0.0021674633026123047, 0.002274632453918457, 0.0023818016052246094, 0.0024889707565307617, 0.002596139907836914, 0.0027033090591430664, 0.0028104782104492188, 0.002917647361755371, 0.0030248165130615234, 0.0031319856643676758, 0.003239154815673828, 0.0033463239669799805, 0.003453493118286133, 0.003560662269592285, 0.0036678314208984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 119.0, 523.0, 309.0, 49.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010006871307268739, -0.000982757075689733, -0.0009648269042372704, -0.0009468968492001295, -0.0009289667359553277, -0.000911036622710526, -0.0008931065676733851, -0.0008751764544285834, -0.0008572463411837816, -0.0008393162279389799, -0.0008213861146941781, -0.0008034560596570373, -0.0007855259464122355, -0.0007675958331674337, -0.0007496657781302929, -0.0007317356648854911, -0.0007138055516406894, -0.0006958754383958876, -0.0006779453251510859, -0.000660015270113945, -0.0006420851568691432, -0.0006241550436243415, -0.0006062249885872006, -0.0005882948753423989, -0.0005703647620975971, -0.0005524346488527954, -0.0005345045356079936, -0.0005165744805708528, -0.000498644367326051, -0.00048071425408124924, -0.00046278416994027793, -0.00044485408579930663, -0.00042692391434684396, -0.0004089938011020422, -0.0003910637169610709, -0.0003731336328200996, -0.00035520351957529783, -0.00033727340633049607, -0.00031934332218952477, -0.00030141323804855347, -0.0002834831248037517, -0.00026555301155894995, -0.00024762292741797864, -0.0002296928287250921, -0.00021176273003220558, -0.00019383263133931905, -0.00017590253264643252, -0.000157972433953546, -0.00014004234981257468, -0.00012211225111968815, -0.00010418215242680162, -8.625205373391509e-05, -6.832195504102856e-05, -5.039185634814203e-05, -3.2461757655255497e-05, -1.4531658962368965e-05, 3.398439730517566e-06, 2.1328538423404098e-05, 3.925863711629063e-05, 5.718873580917716e-05, 7.511883450206369e-05, 9.304893319495022e-05, 0.00011097903188783675, 0.00012890913058072329, 0.00014683922927360982]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 12.0, 12.0, 11.0, 14.0, 19.0, 19.0, 23.0, 41.0, 20.0, 22.0, 32.0, 35.0, 29.0, 38.0, 35.0, 50.0, 45.0, 35.0, 48.0, 44.0, 42.0, 37.0, 37.0, 41.0, 33.0, 20.0, 27.0, 26.0, 24.0, 19.0, 19.0, 19.0, 10.0, 1.0, 14.0, 8.0, 2.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0], "bins": [-0.00011289119720458984, -0.00010976940393447876, -0.00010664761066436768, -0.00010352581739425659, -0.00010040402412414551, -9.728223085403442e-05, -9.416043758392334e-05, -9.103864431381226e-05, -8.791685104370117e-05, -8.479505777359009e-05, -8.1673264503479e-05, -7.855147123336792e-05, -7.542967796325684e-05, -7.230788469314575e-05, -6.918609142303467e-05, -6.606429815292358e-05, -6.29425048828125e-05, -5.9820711612701416e-05, -5.669891834259033e-05, -5.357712507247925e-05, -5.0455331802368164e-05, -4.733353853225708e-05, -4.4211745262145996e-05, -4.108995199203491e-05, -3.796815872192383e-05, -3.4846365451812744e-05, -3.172457218170166e-05, -2.8602778911590576e-05, -2.5480985641479492e-05, -2.2359192371368408e-05, -1.9237399101257324e-05, -1.611560583114624e-05, -1.2993812561035156e-05, -9.872019290924072e-06, -6.750226020812988e-06, -3.6284327507019043e-06, -5.066394805908203e-07, 2.6151537895202637e-06, 5.736947059631348e-06, 8.858740329742432e-06, 1.1980533599853516e-05, 1.51023268699646e-05, 1.8224120140075684e-05, 2.1345913410186768e-05, 2.446770668029785e-05, 2.7589499950408936e-05, 3.071129322052002e-05, 3.3833086490631104e-05, 3.695487976074219e-05, 4.007667303085327e-05, 4.3198466300964355e-05, 4.632025957107544e-05, 4.9442052841186523e-05, 5.256384611129761e-05, 5.568563938140869e-05, 5.8807432651519775e-05, 6.192922592163086e-05, 6.505101919174194e-05, 6.817281246185303e-05, 7.129460573196411e-05, 7.44163990020752e-05, 7.753819227218628e-05, 8.065998554229736e-05, 8.378177881240845e-05, 8.690357208251953e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 12.0, 11.0, 12.0, 14.0, 21.0, 19.0, 22.0, 23.0, 24.0, 29.0, 37.0, 44.0, 42.0, 41.0, 56.0, 50.0, 41.0, 36.0, 36.0, 37.0, 36.0, 32.0, 30.0, 31.0, 36.0, 26.0, 19.0, 24.0, 16.0, 22.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.48046875, -1.432861328125, -1.38525390625, -1.337646484375, -1.2900390625, -1.242431640625, -1.19482421875, -1.147216796875, -1.099609375, -1.052001953125, -1.00439453125, -0.956787109375, -0.9091796875, -0.861572265625, -0.81396484375, -0.766357421875, -0.71875, -0.671142578125, -0.62353515625, -0.575927734375, -0.5283203125, -0.480712890625, -0.43310546875, -0.385498046875, -0.337890625, -0.290283203125, -0.24267578125, -0.195068359375, -0.1474609375, -0.099853515625, -0.05224609375, -0.004638671875, 0.04296875, 0.090576171875, 0.13818359375, 0.185791015625, 0.2333984375, 0.281005859375, 0.32861328125, 0.376220703125, 0.423828125, 0.471435546875, 0.51904296875, 0.566650390625, 0.6142578125, 0.661865234375, 0.70947265625, 0.757080078125, 0.8046875, 0.852294921875, 0.89990234375, 0.947509765625, 0.9951171875, 1.042724609375, 1.09033203125, 1.137939453125, 1.185546875, 1.233154296875, 1.28076171875, 1.328369140625, 1.3759765625, 1.423583984375, 1.47119140625, 1.518798828125, 1.56640625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 7.0, 5.0, 12.0, 10.0, 16.0, 30.0, 32.0, 38.0, 55.0, 95.0, 98.0, 154.0, 207.0, 337.0, 478.0, 789.0, 1611.0, 3246.0, 7989.0, 24446.0, 97705.0, 381692.0, 389632.0, 99418.0, 25117.0, 8116.0, 3231.0, 1514.0, 829.0, 556.0, 324.0, 200.0, 162.0, 111.0, 74.0, 61.0, 36.0, 35.0, 21.0, 22.0, 12.0, 8.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.044921875, -1.976776123046875, -1.90863037109375, -1.840484619140625, -1.7723388671875, -1.704193115234375, -1.63604736328125, -1.567901611328125, -1.499755859375, -1.431610107421875, -1.36346435546875, -1.295318603515625, -1.2271728515625, -1.159027099609375, -1.09088134765625, -1.022735595703125, -0.95458984375, -0.886444091796875, -0.81829833984375, -0.750152587890625, -0.6820068359375, -0.613861083984375, -0.54571533203125, -0.477569580078125, -0.409423828125, -0.341278076171875, -0.27313232421875, -0.204986572265625, -0.1368408203125, -0.068695068359375, -0.00054931640625, 0.067596435546875, 0.1357421875, 0.203887939453125, 0.27203369140625, 0.340179443359375, 0.4083251953125, 0.476470947265625, 0.54461669921875, 0.612762451171875, 0.680908203125, 0.749053955078125, 0.81719970703125, 0.885345458984375, 0.9534912109375, 1.021636962890625, 1.08978271484375, 1.157928466796875, 1.22607421875, 1.294219970703125, 1.36236572265625, 1.430511474609375, 1.4986572265625, 1.566802978515625, 1.63494873046875, 1.703094482421875, 1.771240234375, 1.839385986328125, 1.90753173828125, 1.975677490234375, 2.0438232421875, 2.111968994140625, 2.18011474609375, 2.248260498046875, 2.31640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 6.0, 5.0, 11.0, 13.0, 11.0, 12.0, 12.0, 16.0, 28.0, 23.0, 24.0, 27.0, 34.0, 27.0, 40.0, 35.0, 60.0, 83.0, 112.0, 338.0, 1463.0, 152.0, 80.0, 58.0, 48.0, 52.0, 34.0, 34.0, 21.0, 18.0, 27.0, 19.0, 17.0, 18.0, 15.0, 11.0, 8.0, 10.0, 11.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.99981689453125, -4.8394775390625, -4.67913818359375, -4.518798828125, -4.35845947265625, -4.1981201171875, -4.03778076171875, -3.87744140625, -3.71710205078125, -3.5567626953125, -3.39642333984375, -3.236083984375, -3.07574462890625, -2.9154052734375, -2.75506591796875, -2.5947265625, -2.43438720703125, -2.2740478515625, -2.11370849609375, -1.953369140625, -1.79302978515625, -1.6326904296875, -1.47235107421875, -1.31201171875, -1.15167236328125, -0.9913330078125, -0.83099365234375, -0.670654296875, -0.51031494140625, -0.3499755859375, -0.18963623046875, -0.029296875, 0.13104248046875, 0.2913818359375, 0.45172119140625, 0.612060546875, 0.77239990234375, 0.9327392578125, 1.09307861328125, 1.25341796875, 1.41375732421875, 1.5740966796875, 1.73443603515625, 1.894775390625, 2.05511474609375, 2.2154541015625, 2.37579345703125, 2.5361328125, 2.69647216796875, 2.8568115234375, 3.01715087890625, 3.177490234375, 3.33782958984375, 3.4981689453125, 3.65850830078125, 3.81884765625, 3.97918701171875, 4.1395263671875, 4.29986572265625, 4.460205078125, 4.62054443359375, 4.7808837890625, 4.94122314453125, 5.1015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 11.0, 8.0, 6.0, 17.0, 19.0, 27.0, 33.0, 41.0, 54.0, 63.0, 87.0, 154.0, 301.0, 705.0, 3112.0, 73598.0, 3022724.0, 40903.0, 2447.0, 592.0, 270.0, 168.0, 82.0, 66.0, 56.0, 34.0, 27.0, 18.0, 24.0, 20.0, 8.0, 6.0, 7.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.72900390625, -10.3876953125, -10.04638671875, -9.705078125, -9.36376953125, -9.0224609375, -8.68115234375, -8.33984375, -7.99853515625, -7.6572265625, -7.31591796875, -6.974609375, -6.63330078125, -6.2919921875, -5.95068359375, -5.609375, -5.26806640625, -4.9267578125, -4.58544921875, -4.244140625, -3.90283203125, -3.5615234375, -3.22021484375, -2.87890625, -2.53759765625, -2.1962890625, -1.85498046875, -1.513671875, -1.17236328125, -0.8310546875, -0.48974609375, -0.1484375, 0.19287109375, 0.5341796875, 0.87548828125, 1.216796875, 1.55810546875, 1.8994140625, 2.24072265625, 2.58203125, 2.92333984375, 3.2646484375, 3.60595703125, 3.947265625, 4.28857421875, 4.6298828125, 4.97119140625, 5.3125, 5.65380859375, 5.9951171875, 6.33642578125, 6.677734375, 7.01904296875, 7.3603515625, 7.70166015625, 8.04296875, 8.38427734375, 8.7255859375, 9.06689453125, 9.408203125, 9.74951171875, 10.0908203125, 10.43212890625, 10.7734375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [16.0, 441.0, 548.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.105020523071289, -2.1163346767425537, -0.12764883041381836, 1.861037254333496, 3.8497228622436523, 5.838408470153809, 7.827095031738281, 9.815780639648438, 11.804466247558594, 13.79315185546875, 15.781837463378906, 17.770523071289062, 19.75920867919922, 21.747894287109375, 23.736581802368164, 25.72526741027832, 27.713953018188477, 29.702638626098633, 31.69132423400879, 33.68001174926758, 35.668697357177734, 37.65738296508789, 39.64606857299805, 41.6347541809082, 43.62343978881836, 45.612125396728516, 47.60081100463867, 49.58949661254883, 51.578182220458984, 53.56686782836914, 55.55555725097656, 57.54424285888672, 59.532928466796875, 61.52161407470703, 63.51029968261719, 65.49898529052734, 67.4876708984375, 69.47635650634766, 71.46504211425781, 73.45372772216797, 75.44241333007812, 77.43109893798828, 79.41978454589844, 81.4084701538086, 83.39715576171875, 85.3858413696289, 87.37452697753906, 89.36321258544922, 91.35189819335938, 93.34058380126953, 95.32926940917969, 97.31795501708984, 99.306640625, 101.29532623291016, 103.28401184082031, 105.27269744873047, 107.26139068603516, 109.25007629394531, 111.23876190185547, 113.22744750976562, 115.21613311767578, 117.20481872558594, 119.1935043334961, 121.18218994140625, 123.1708755493164]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 8.0, 9.0, 8.0, 11.0, 11.0, 17.0, 20.0, 20.0, 21.0, 26.0, 26.0, 28.0, 27.0, 24.0, 21.0, 36.0, 26.0, 42.0, 37.0, 39.0, 38.0, 29.0, 41.0, 48.0, 38.0, 29.0, 35.0, 32.0, 27.0, 30.0, 31.0, 23.0, 11.0, 15.0, 19.0, 13.0, 19.0, 13.0, 13.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.06462860107422, -15.56001091003418, -15.05539321899414, -14.550775527954102, -14.046157836914062, -13.541540145874023, -13.036921501159668, -12.532303810119629, -12.02768611907959, -11.52306842803955, -11.018450736999512, -10.513833045959473, -10.009214401245117, -9.504596710205078, -8.999979019165039, -8.495361328125, -7.990743637084961, -7.486125946044922, -6.981508255004883, -6.4768900871276855, -5.9722723960876465, -5.467654705047607, -4.96303653717041, -4.458418846130371, -3.953801155090332, -3.449183464050293, -2.944565534591675, -2.4399476051330566, -1.9353299140930176, -1.4307122230529785, -0.9260942935943604, -0.4214763641357422, 0.08314132690429688, 0.5877591371536255, 1.092376947402954, 1.5969947576522827, 2.1016125679016113, 2.6062302589416504, 3.1108481884002686, 3.6154661178588867, 4.120083808898926, 4.624701499938965, 5.129319190979004, 5.633937358856201, 6.13855504989624, 6.643172740936279, 7.147790908813477, 7.652408599853516, 8.157026290893555, 8.661643981933594, 9.166261672973633, 9.670879364013672, 10.175497055053711, 10.68011474609375, 11.184733390808105, 11.689351081848145, 12.193968772888184, 12.698586463928223, 13.203204154968262, 13.7078218460083, 14.212440490722656, 14.717058181762695, 15.221675872802734, 15.726293563842773, 16.230911254882812]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 8.0, 10.0, 10.0, 9.0, 12.0, 9.0, 14.0, 12.0, 18.0, 21.0, 18.0, 10.0, 20.0, 33.0, 21.0, 42.0, 32.0, 46.0, 41.0, 56.0, 50.0, 38.0, 44.0, 34.0, 43.0, 38.0, 29.0, 22.0, 35.0, 27.0, 31.0, 24.0, 30.0, 26.0, 14.0, 25.0, 7.0, 7.0, 9.0, 4.0, 1.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5173492431640625, -1.467315673828125, -1.4172821044921875, -1.36724853515625, -1.3172149658203125, -1.267181396484375, -1.2171478271484375, -1.1671142578125, -1.1170806884765625, -1.067047119140625, -1.0170135498046875, -0.96697998046875, -0.9169464111328125, -0.866912841796875, -0.8168792724609375, -0.766845703125, -0.7168121337890625, -0.666778564453125, -0.6167449951171875, -0.56671142578125, -0.5166778564453125, -0.466644287109375, -0.4166107177734375, -0.3665771484375, -0.3165435791015625, -0.266510009765625, -0.2164764404296875, -0.16644287109375, -0.1164093017578125, -0.066375732421875, -0.0163421630859375, 0.03369140625, 0.0837249755859375, 0.133758544921875, 0.1837921142578125, 0.23382568359375, 0.2838592529296875, 0.333892822265625, 0.3839263916015625, 0.4339599609375, 0.4839935302734375, 0.534027099609375, 0.5840606689453125, 0.63409423828125, 0.6841278076171875, 0.734161376953125, 0.7841949462890625, 0.834228515625, 0.8842620849609375, 0.934295654296875, 0.9843292236328125, 1.03436279296875, 1.0843963623046875, 1.134429931640625, 1.1844635009765625, 1.2344970703125, 1.2845306396484375, 1.334564208984375, 1.3845977783203125, 1.43463134765625, 1.4846649169921875, 1.534698486328125, 1.5847320556640625, 1.634765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 6.0, 6.0, 14.0, 8.0, 8.0, 19.0, 22.0, 17.0, 22.0, 44.0, 70.0, 116.0, 179.0, 371.0, 833.0, 2289.0, 7603.0, 33281.0, 211460.0, 1460883.0, 2016106.0, 389176.0, 54733.0, 11623.0, 3252.0, 1105.0, 433.0, 203.0, 115.0, 82.0, 52.0, 41.0, 25.0, 13.0, 19.0, 12.0, 5.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.264923095703125, -3.15289306640625, -3.040863037109375, -2.9288330078125, -2.816802978515625, -2.70477294921875, -2.592742919921875, -2.480712890625, -2.368682861328125, -2.25665283203125, -2.144622802734375, -2.0325927734375, -1.920562744140625, -1.80853271484375, -1.696502685546875, -1.58447265625, -1.472442626953125, -1.36041259765625, -1.248382568359375, -1.1363525390625, -1.024322509765625, -0.91229248046875, -0.800262451171875, -0.688232421875, -0.576202392578125, -0.46417236328125, -0.352142333984375, -0.2401123046875, -0.128082275390625, -0.01605224609375, 0.095977783203125, 0.2080078125, 0.320037841796875, 0.43206787109375, 0.544097900390625, 0.6561279296875, 0.768157958984375, 0.88018798828125, 0.992218017578125, 1.104248046875, 1.216278076171875, 1.32830810546875, 1.440338134765625, 1.5523681640625, 1.664398193359375, 1.77642822265625, 1.888458251953125, 2.00048828125, 2.112518310546875, 2.22454833984375, 2.336578369140625, 2.4486083984375, 2.560638427734375, 2.67266845703125, 2.784698486328125, 2.896728515625, 3.008758544921875, 3.12078857421875, 3.232818603515625, 3.3448486328125, 3.456878662109375, 3.56890869140625, 3.680938720703125, 3.79296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 7.0, 17.0, 11.0, 15.0, 31.0, 39.0, 40.0, 70.0, 73.0, 119.0, 142.0, 190.0, 265.0, 301.0, 405.0, 389.0, 419.0, 306.0, 286.0, 223.0, 154.0, 135.0, 97.0, 87.0, 53.0, 55.0, 28.0, 26.0, 20.0, 10.0, 10.0, 12.0, 5.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7578125, -3.63153076171875, -3.5052490234375, -3.37896728515625, -3.252685546875, -3.12640380859375, -3.0001220703125, -2.87384033203125, -2.74755859375, -2.62127685546875, -2.4949951171875, -2.36871337890625, -2.242431640625, -2.11614990234375, -1.9898681640625, -1.86358642578125, -1.7373046875, -1.61102294921875, -1.4847412109375, -1.35845947265625, -1.232177734375, -1.10589599609375, -0.9796142578125, -0.85333251953125, -0.72705078125, -0.60076904296875, -0.4744873046875, -0.34820556640625, -0.221923828125, -0.09564208984375, 0.0306396484375, 0.15692138671875, 0.283203125, 0.40948486328125, 0.5357666015625, 0.66204833984375, 0.788330078125, 0.91461181640625, 1.0408935546875, 1.16717529296875, 1.29345703125, 1.41973876953125, 1.5460205078125, 1.67230224609375, 1.798583984375, 1.92486572265625, 2.0511474609375, 2.17742919921875, 2.3037109375, 2.42999267578125, 2.5562744140625, 2.68255615234375, 2.808837890625, 2.93511962890625, 3.0614013671875, 3.18768310546875, 3.31396484375, 3.44024658203125, 3.5665283203125, 3.69281005859375, 3.819091796875, 3.94537353515625, 4.0716552734375, 4.19793701171875, 4.32421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 10.0, 12.0, 23.0, 35.0, 55.0, 97.0, 172.0, 478.0, 2740.0, 153447.0, 3952261.0, 82074.0, 2082.0, 415.0, 165.0, 99.0, 50.0, 20.0, 22.0, 8.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.53125, -23.9532470703125, -23.375244140625, -22.7972412109375, -22.21923828125, -21.6412353515625, -21.063232421875, -20.4852294921875, -19.9072265625, -19.3292236328125, -18.751220703125, -18.1732177734375, -17.59521484375, -17.0172119140625, -16.439208984375, -15.8612060546875, -15.283203125, -14.7052001953125, -14.127197265625, -13.5491943359375, -12.97119140625, -12.3931884765625, -11.815185546875, -11.2371826171875, -10.6591796875, -10.0811767578125, -9.503173828125, -8.9251708984375, -8.34716796875, -7.7691650390625, -7.191162109375, -6.6131591796875, -6.03515625, -5.4571533203125, -4.879150390625, -4.3011474609375, -3.72314453125, -3.1451416015625, -2.567138671875, -1.9891357421875, -1.4111328125, -0.8331298828125, -0.255126953125, 0.3228759765625, 0.90087890625, 1.4788818359375, 2.056884765625, 2.6348876953125, 3.212890625, 3.7908935546875, 4.368896484375, 4.9468994140625, 5.52490234375, 6.1029052734375, 6.680908203125, 7.2589111328125, 7.8369140625, 8.4149169921875, 8.992919921875, 9.5709228515625, 10.14892578125, 10.7269287109375, 11.304931640625, 11.8829345703125, 12.4609375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 14.0, 42.0, 75.0, 109.0, 184.0, 195.0, 167.0, 115.0, 57.0, 30.0, 12.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.153446197509766, -42.1279411315918, -41.102439880371094, -40.076934814453125, -39.051429748535156, -38.02592468261719, -37.00041961669922, -35.974918365478516, -34.94941329956055, -33.92390823364258, -32.898406982421875, -31.872901916503906, -30.847396850585938, -29.82189178466797, -28.796388626098633, -27.770885467529297, -26.745380401611328, -25.71987533569336, -24.694372177124023, -23.668869018554688, -22.64336395263672, -21.61785888671875, -20.592355728149414, -19.566852569580078, -18.54134750366211, -17.51584243774414, -16.490339279174805, -15.464835166931152, -14.4393310546875, -13.413826942443848, -12.388322830200195, -11.362818717956543, -10.33731460571289, -9.311810493469238, -8.286306381225586, -7.260802268981934, -6.235298156738281, -5.209794044494629, -4.184289932250977, -3.158785820007324, -2.133281707763672, -1.1077775955200195, -0.08227348327636719, 0.9432306289672852, 1.9687347412109375, 2.99423885345459, 4.019742965698242, 5.0452470779418945, 6.070751190185547, 7.096255302429199, 8.121759414672852, 9.147263526916504, 10.172767639160156, 11.198271751403809, 12.223775863647461, 13.249279975891113, 14.274784088134766, 15.300288200378418, 16.32579231262207, 17.351295471191406, 18.376800537109375, 19.402305603027344, 20.42780876159668, 21.453311920166016, 22.478816986083984]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 7.0, 10.0, 9.0, 15.0, 11.0, 18.0, 25.0, 18.0, 24.0, 23.0, 36.0, 29.0, 26.0, 24.0, 31.0, 44.0, 28.0, 33.0, 30.0, 36.0, 42.0, 41.0, 39.0, 45.0, 31.0, 42.0, 33.0, 29.0, 29.0, 21.0, 28.0, 27.0, 16.0, 18.0, 18.0, 17.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.86210823059082, -12.397945404052734, -11.933783531188965, -11.469621658325195, -11.00545883178711, -10.541296005249023, -10.077134132385254, -9.612972259521484, -9.148809432983398, -8.684646606445312, -8.220484733581543, -7.756322383880615, -7.2921600341796875, -6.82799768447876, -6.363835334777832, -5.899672985076904, -5.435510635375977, -4.971348285675049, -4.507185935974121, -4.043023586273193, -3.5788612365722656, -3.114698886871338, -2.65053653717041, -2.1863741874694824, -1.7222118377685547, -1.258049488067627, -0.7938871383666992, -0.3297247886657715, 0.13443756103515625, 0.598599910736084, 1.0627622604370117, 1.5269246101379395, 1.9910869598388672, 2.455249309539795, 2.9194116592407227, 3.3835740089416504, 3.847736358642578, 4.311898708343506, 4.776061058044434, 5.240223407745361, 5.704385757446289, 6.168548107147217, 6.6327104568481445, 7.096872806549072, 7.56103515625, 8.025197982788086, 8.489359855651855, 8.953521728515625, 9.417684555053711, 9.881847381591797, 10.346009254455566, 10.810171127319336, 11.274333953857422, 11.738496780395508, 12.202658653259277, 12.666820526123047, 13.130983352661133, 13.595146179199219, 14.059308052062988, 14.523469924926758, 14.987632751464844, 15.45179557800293, 15.9159574508667, 16.38011932373047, 16.844282150268555]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 5.0, 11.0, 7.0, 10.0, 10.0, 16.0, 12.0, 15.0, 15.0, 18.0, 11.0, 22.0, 33.0, 27.0, 34.0, 41.0, 36.0, 32.0, 40.0, 52.0, 35.0, 39.0, 30.0, 36.0, 42.0, 40.0, 40.0, 28.0, 34.0, 22.0, 23.0, 26.0, 21.0, 25.0, 19.0, 15.0, 9.0, 12.0, 8.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.669921875, -1.621978759765625, -1.57403564453125, -1.526092529296875, -1.4781494140625, -1.430206298828125, -1.38226318359375, -1.334320068359375, -1.286376953125, -1.238433837890625, -1.19049072265625, -1.142547607421875, -1.0946044921875, -1.046661376953125, -0.99871826171875, -0.950775146484375, -0.90283203125, -0.854888916015625, -0.80694580078125, -0.759002685546875, -0.7110595703125, -0.663116455078125, -0.61517333984375, -0.567230224609375, -0.519287109375, -0.471343994140625, -0.42340087890625, -0.375457763671875, -0.3275146484375, -0.279571533203125, -0.23162841796875, -0.183685302734375, -0.1357421875, -0.087799072265625, -0.03985595703125, 0.008087158203125, 0.0560302734375, 0.103973388671875, 0.15191650390625, 0.199859619140625, 0.247802734375, 0.295745849609375, 0.34368896484375, 0.391632080078125, 0.4395751953125, 0.487518310546875, 0.53546142578125, 0.583404541015625, 0.63134765625, 0.679290771484375, 0.72723388671875, 0.775177001953125, 0.8231201171875, 0.871063232421875, 0.91900634765625, 0.966949462890625, 1.014892578125, 1.062835693359375, 1.11077880859375, 1.158721923828125, 1.2066650390625, 1.254608154296875, 1.30255126953125, 1.350494384765625, 1.3984375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 15.0, 9.0, 16.0, 29.0, 46.0, 53.0, 113.0, 162.0, 219.0, 289.0, 438.0, 569.0, 797.0, 1077.0, 1569.0, 2122.0, 2902.0, 4109.0, 5914.0, 8265.0, 11448.0, 16411.0, 23927.0, 35521.0, 55488.0, 90266.0, 160143.0, 239834.0, 144633.0, 82602.0, 50952.0, 32832.0, 22306.0, 15197.0, 10939.0, 7751.0, 5525.0, 4006.0, 2856.0, 2023.0, 1432.0, 1141.0, 810.0, 513.0, 450.0, 235.0, 197.0, 146.0, 86.0, 57.0, 64.0, 26.0, 17.0, 10.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24109649658203125, -0.2331695556640625, -0.22524261474609375, -0.217315673828125, -0.20938873291015625, -0.2014617919921875, -0.19353485107421875, -0.18560791015625, -0.17768096923828125, -0.1697540283203125, -0.16182708740234375, -0.153900146484375, -0.14597320556640625, -0.1380462646484375, -0.13011932373046875, -0.1221923828125, -0.11426544189453125, -0.1063385009765625, -0.09841156005859375, -0.090484619140625, -0.08255767822265625, -0.0746307373046875, -0.06670379638671875, -0.05877685546875, -0.05084991455078125, -0.0429229736328125, -0.03499603271484375, -0.027069091796875, -0.01914215087890625, -0.0112152099609375, -0.00328826904296875, 0.004638671875, 0.01256561279296875, 0.0204925537109375, 0.02841949462890625, 0.036346435546875, 0.04427337646484375, 0.0522003173828125, 0.06012725830078125, 0.06805419921875, 0.07598114013671875, 0.0839080810546875, 0.09183502197265625, 0.099761962890625, 0.10768890380859375, 0.1156158447265625, 0.12354278564453125, 0.1314697265625, 0.13939666748046875, 0.1473236083984375, 0.15525054931640625, 0.163177490234375, 0.17110443115234375, 0.1790313720703125, 0.18695831298828125, 0.19488525390625, 0.20281219482421875, 0.2107391357421875, 0.21866607666015625, 0.226593017578125, 0.23451995849609375, 0.2424468994140625, 0.25037384033203125, 0.25830078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 7.0, 10.0, 7.0, 6.0, 11.0, 15.0, 19.0, 20.0, 25.0, 23.0, 33.0, 28.0, 19.0, 31.0, 40.0, 46.0, 31.0, 42.0, 49.0, 1058.0, 35.0, 44.0, 31.0, 52.0, 32.0, 32.0, 32.0, 28.0, 22.0, 21.0, 18.0, 18.0, 20.0, 24.0, 18.0, 14.0, 10.0, 8.0, 10.0, 6.0, 7.0, 1.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.025390625, -0.9940109252929688, -0.9626312255859375, -0.9312515258789062, -0.899871826171875, -0.8684921264648438, -0.8371124267578125, -0.8057327270507812, -0.77435302734375, -0.7429733276367188, -0.7115936279296875, -0.6802139282226562, -0.648834228515625, -0.6174545288085938, -0.5860748291015625, -0.5546951293945312, -0.5233154296875, -0.49193572998046875, -0.4605560302734375, -0.42917633056640625, -0.397796630859375, -0.36641693115234375, -0.3350372314453125, -0.30365753173828125, -0.27227783203125, -0.24089813232421875, -0.2095184326171875, -0.17813873291015625, -0.146759033203125, -0.11537933349609375, -0.0839996337890625, -0.05261993408203125, -0.021240234375, 0.01013946533203125, 0.0415191650390625, 0.07289886474609375, 0.104278564453125, 0.13565826416015625, 0.1670379638671875, 0.19841766357421875, 0.22979736328125, 0.26117706298828125, 0.2925567626953125, 0.32393646240234375, 0.355316162109375, 0.38669586181640625, 0.4180755615234375, 0.44945526123046875, 0.4808349609375, 0.5122146606445312, 0.5435943603515625, 0.5749740600585938, 0.606353759765625, 0.6377334594726562, 0.6691131591796875, 0.7004928588867188, 0.73187255859375, 0.7632522583007812, 0.7946319580078125, 0.8260116577148438, 0.857391357421875, 0.8887710571289062, 0.9201507568359375, 0.9515304565429688, 0.98291015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 9.0, 8.0, 10.0, 15.0, 19.0, 47.0, 53.0, 81.0, 130.0, 216.0, 274.0, 368.0, 621.0, 902.0, 1223.0, 1823.0, 2626.0, 4053.0, 5755.0, 8518.0, 12679.0, 18980.0, 29341.0, 47612.0, 82815.0, 161117.0, 1337754.0, 162145.0, 83089.0, 47815.0, 29637.0, 18921.0, 12262.0, 8278.0, 5640.0, 3751.0, 2665.0, 1791.0, 1293.0, 845.0, 637.0, 427.0, 269.0, 199.0, 145.0, 91.0, 74.0, 37.0, 33.0, 18.0, 9.0, 12.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.27685546875, -0.2683372497558594, -0.25981903076171875, -0.2513008117675781, -0.2427825927734375, -0.23426437377929688, -0.22574615478515625, -0.21722793579101562, -0.208709716796875, -0.20019149780273438, -0.19167327880859375, -0.18315505981445312, -0.1746368408203125, -0.16611862182617188, -0.15760040283203125, -0.14908218383789062, -0.14056396484375, -0.13204574584960938, -0.12352752685546875, -0.11500930786132812, -0.1064910888671875, -0.09797286987304688, -0.08945465087890625, -0.08093643188476562, -0.072418212890625, -0.06389999389648438, -0.05538177490234375, -0.046863555908203125, -0.0383453369140625, -0.029827117919921875, -0.02130889892578125, -0.012790679931640625, -0.0042724609375, 0.004245758056640625, 0.01276397705078125, 0.021282196044921875, 0.0298004150390625, 0.038318634033203125, 0.04683685302734375, 0.055355072021484375, 0.063873291015625, 0.07239151000976562, 0.08090972900390625, 0.08942794799804688, 0.0979461669921875, 0.10646438598632812, 0.11498260498046875, 0.12350082397460938, 0.13201904296875, 0.14053726196289062, 0.14905548095703125, 0.15757369995117188, 0.1660919189453125, 0.17461013793945312, 0.18312835693359375, 0.19164657592773438, 0.200164794921875, 0.20868301391601562, 0.21720123291015625, 0.22571945190429688, 0.2342376708984375, 0.24275588989257812, 0.25127410888671875, 0.2597923278808594, 0.268310546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 14.0, 14.0, 14.0, 15.0, 18.0, 22.0, 28.0, 37.0, 37.0, 33.0, 62.0, 50.0, 51.0, 49.0, 67.0, 47.0, 54.0, 50.0, 48.0, 42.0, 36.0, 40.0, 24.0, 30.0, 20.0, 17.0, 15.0, 7.0, 6.0, 3.0, 8.0, 2.0, 9.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013875961303710938, -0.0001340322196483612, -0.00012930482625961304, -0.00012457743287086487, -0.0001198500394821167, -0.00011512264609336853, -0.00011039525270462036, -0.00010566785931587219, -0.00010094046592712402, -9.621307253837585e-05, -9.148567914962769e-05, -8.675828576087952e-05, -8.203089237213135e-05, -7.730349898338318e-05, -7.257610559463501e-05, -6.784871220588684e-05, -6.312131881713867e-05, -5.83939254283905e-05, -5.3666532039642334e-05, -4.8939138650894165e-05, -4.4211745262145996e-05, -3.948435187339783e-05, -3.475695848464966e-05, -3.002956509590149e-05, -2.530217170715332e-05, -2.057477831840515e-05, -1.5847384929656982e-05, -1.1119991540908813e-05, -6.3925981521606445e-06, -1.6652047634124756e-06, 3.0621886253356934e-06, 7.789582014083862e-06, 1.2516975402832031e-05, 1.72443687915802e-05, 2.197176218032837e-05, 2.6699155569076538e-05, 3.142654895782471e-05, 3.6153942346572876e-05, 4.0881335735321045e-05, 4.5608729124069214e-05, 5.033612251281738e-05, 5.506351590156555e-05, 5.979090929031372e-05, 6.451830267906189e-05, 6.924569606781006e-05, 7.397308945655823e-05, 7.87004828453064e-05, 8.342787623405457e-05, 8.815526962280273e-05, 9.28826630115509e-05, 9.761005640029907e-05, 0.00010233744978904724, 0.00010706484317779541, 0.00011179223656654358, 0.00011651962995529175, 0.00012124702334403992, 0.00012597441673278809, 0.00013070181012153625, 0.00013542920351028442, 0.0001401565968990326, 0.00014488399028778076, 0.00014961138367652893, 0.0001543387770652771, 0.00015906617045402527, 0.00016379356384277344]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 12.0, 6.0, 13.0, 5.0, 9.0, 16.0, 12.0, 36.0, 44.0, 64.0, 67.0, 101.0, 162.0, 187.0, 282.0, 483.0, 999.0, 80256.0, 957159.0, 6674.0, 659.0, 392.0, 249.0, 173.0, 119.0, 82.0, 63.0, 59.0, 33.0, 26.0, 26.0, 16.0, 13.0, 14.0, 11.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0032215118408203125, -0.0031276047229766846, -0.0030336976051330566, -0.0029397904872894287, -0.0028458833694458008, -0.002751976251602173, -0.002658069133758545, -0.002564162015914917, -0.002470254898071289, -0.002376347780227661, -0.002282440662384033, -0.0021885335445404053, -0.0020946264266967773, -0.0020007193088531494, -0.0019068121910095215, -0.0018129050731658936, -0.0017189979553222656, -0.0016250908374786377, -0.0015311837196350098, -0.0014372766017913818, -0.001343369483947754, -0.001249462366104126, -0.001155555248260498, -0.0010616481304168701, -0.0009677410125732422, -0.0008738338947296143, -0.0007799267768859863, -0.0006860196590423584, -0.0005921125411987305, -0.0004982054233551025, -0.0004042983055114746, -0.0003103911876678467, -0.00021648406982421875, -0.00012257695198059082, -2.866983413696289e-05, 6.523728370666504e-05, 0.00015914440155029297, 0.0002530515193939209, 0.00034695863723754883, 0.00044086575508117676, 0.0005347728729248047, 0.0006286799907684326, 0.0007225871086120605, 0.0008164942264556885, 0.0009104013442993164, 0.0010043084621429443, 0.0010982155799865723, 0.0011921226978302002, 0.0012860298156738281, 0.001379936933517456, 0.001473844051361084, 0.001567751169204712, 0.0016616582870483398, 0.0017555654048919678, 0.0018494725227355957, 0.0019433796405792236, 0.0020372867584228516, 0.0021311938762664795, 0.0022251009941101074, 0.0023190081119537354, 0.0024129152297973633, 0.002506822347640991, 0.002600729465484619, 0.002694636583328247, 0.002788543701171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 65.0, 299.0, 409.0, 196.0, 30.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004159118980169296, -0.0004017203173134476, -0.00038752873660996556, -0.00037333715590648353, -0.0003591455752030015, -0.00034495399449951947, -0.00033076241379603744, -0.00031657086219638586, -0.00030237925238907337, -0.00028818767168559134, -0.0002739960909821093, -0.0002598045102786273, -0.00024561292957514524, -0.0002314213488716632, -0.0002172297827200964, -0.00020303820201661438, -0.00018884663586504757, -0.00017465505516156554, -0.0001604634744580835, -0.00014627189375460148, -0.00013208031305111945, -0.00011788873962359503, -0.00010369716619607061, -8.950558549258858e-05, -7.531400478910655e-05, -6.112242408562452e-05, -4.693084702012129e-05, -3.2739269954618067e-05, -1.8547689251136035e-05, -4.356108547654003e-06, 9.835464879870415e-06, 2.4027045583352447e-05, 3.821862628683448e-05, 5.241020699031651e-05, 6.660178769379854e-05, 8.079336112132296e-05, 9.498494182480499e-05, 0.00010917652252828702, 0.00012336809595581144, 0.00013755967665929347, 0.0001517512573627755, 0.00016594283806625754, 0.00018013441876973957, 0.00019432598492130637, 0.0002085175656247884, 0.00022270914632827044, 0.00023690072703175247, 0.0002510923077352345, 0.00026528388843871653, 0.00027947546914219856, 0.0002936670498456806, 0.0003078586305491626, 0.00032205021125264466, 0.0003362417919561267, 0.00035043334355577826, 0.00036462495336309075, 0.00037881650496274233, 0.00039300808566622436, 0.0004071996663697064, 0.0004213912470731884, 0.00043558282777667046, 0.0004497744084801525, 0.0004639659891836345, 0.0004781575407832861, 0.0004923491505905986]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 5.0, 12.0, 15.0, 21.0, 20.0, 22.0, 34.0, 40.0, 36.0, 38.0, 41.0, 40.0, 37.0, 43.0, 43.0, 47.0, 35.0, 39.0, 50.0, 48.0, 35.0, 39.0, 35.0, 34.0, 26.0, 21.0, 24.0, 18.0, 20.0, 15.0, 11.0, 14.0, 10.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.690357208251953e-05, -8.42418521642685e-05, -8.158013224601746e-05, -7.891841232776642e-05, -7.625669240951538e-05, -7.359497249126434e-05, -7.09332525730133e-05, -6.827153265476227e-05, -6.560981273651123e-05, -6.294809281826019e-05, -6.0286372900009155e-05, -5.762465298175812e-05, -5.496293306350708e-05, -5.230121314525604e-05, -4.9639493227005005e-05, -4.697777330875397e-05, -4.431605339050293e-05, -4.165433347225189e-05, -3.8992613554000854e-05, -3.633089363574982e-05, -3.366917371749878e-05, -3.100745379924774e-05, -2.8345733880996704e-05, -2.5684013962745667e-05, -2.302229404449463e-05, -2.036057412624359e-05, -1.7698854207992554e-05, -1.5037134289741516e-05, -1.2375414371490479e-05, -9.713694453239441e-06, -7.051974534988403e-06, -4.390254616737366e-06, -1.7285346984863281e-06, 9.331852197647095e-07, 3.594905138015747e-06, 6.256625056266785e-06, 8.918344974517822e-06, 1.158006489276886e-05, 1.4241784811019897e-05, 1.6903504729270935e-05, 1.9565224647521973e-05, 2.222694456577301e-05, 2.4888664484024048e-05, 2.7550384402275085e-05, 3.0212104320526123e-05, 3.287382423877716e-05, 3.55355441570282e-05, 3.8197264075279236e-05, 4.0858983993530273e-05, 4.352070391178131e-05, 4.618242383003235e-05, 4.8844143748283386e-05, 5.1505863666534424e-05, 5.416758358478546e-05, 5.68293035030365e-05, 5.949102342128754e-05, 6.215274333953857e-05, 6.481446325778961e-05, 6.747618317604065e-05, 7.013790309429169e-05, 7.279962301254272e-05, 7.546134293079376e-05, 7.81230628490448e-05, 8.078478276729584e-05, 8.344650268554688e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 5.0, 11.0, 7.0, 10.0, 10.0, 16.0, 12.0, 15.0, 15.0, 18.0, 11.0, 22.0, 33.0, 27.0, 34.0, 41.0, 36.0, 32.0, 40.0, 52.0, 35.0, 39.0, 30.0, 36.0, 42.0, 40.0, 40.0, 28.0, 34.0, 22.0, 23.0, 26.0, 21.0, 25.0, 19.0, 15.0, 9.0, 12.0, 8.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.669921875, -1.621978759765625, -1.57403564453125, -1.526092529296875, -1.4781494140625, -1.430206298828125, -1.38226318359375, -1.334320068359375, -1.286376953125, -1.238433837890625, -1.19049072265625, -1.142547607421875, -1.0946044921875, -1.046661376953125, -0.99871826171875, -0.950775146484375, -0.90283203125, -0.854888916015625, -0.80694580078125, -0.759002685546875, -0.7110595703125, -0.663116455078125, -0.61517333984375, -0.567230224609375, -0.519287109375, -0.471343994140625, -0.42340087890625, -0.375457763671875, -0.3275146484375, -0.279571533203125, -0.23162841796875, -0.183685302734375, -0.1357421875, -0.087799072265625, -0.03985595703125, 0.008087158203125, 0.0560302734375, 0.103973388671875, 0.15191650390625, 0.199859619140625, 0.247802734375, 0.295745849609375, 0.34368896484375, 0.391632080078125, 0.4395751953125, 0.487518310546875, 0.53546142578125, 0.583404541015625, 0.63134765625, 0.679290771484375, 0.72723388671875, 0.775177001953125, 0.8231201171875, 0.871063232421875, 0.91900634765625, 0.966949462890625, 1.014892578125, 1.062835693359375, 1.11077880859375, 1.158721923828125, 1.2066650390625, 1.254608154296875, 1.30255126953125, 1.350494384765625, 1.3984375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 7.0, 12.0, 16.0, 24.0, 20.0, 42.0, 54.0, 84.0, 110.0, 183.0, 287.0, 433.0, 708.0, 1186.0, 1847.0, 3170.0, 5639.0, 10444.0, 21015.0, 43724.0, 91790.0, 175495.0, 250345.0, 209469.0, 118205.0, 57007.0, 26961.0, 13308.0, 7014.0, 3871.0, 2297.0, 1350.0, 877.0, 528.0, 336.0, 231.0, 156.0, 96.0, 60.0, 46.0, 25.0, 22.0, 16.0, 7.0, 8.0, 7.0, 10.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2685546875, -1.229736328125, -1.19091796875, -1.152099609375, -1.11328125, -1.074462890625, -1.03564453125, -0.996826171875, -0.9580078125, -0.919189453125, -0.88037109375, -0.841552734375, -0.802734375, -0.763916015625, -0.72509765625, -0.686279296875, -0.6474609375, -0.608642578125, -0.56982421875, -0.531005859375, -0.4921875, -0.453369140625, -0.41455078125, -0.375732421875, -0.3369140625, -0.298095703125, -0.25927734375, -0.220458984375, -0.181640625, -0.142822265625, -0.10400390625, -0.065185546875, -0.0263671875, 0.012451171875, 0.05126953125, 0.090087890625, 0.12890625, 0.167724609375, 0.20654296875, 0.245361328125, 0.2841796875, 0.322998046875, 0.36181640625, 0.400634765625, 0.439453125, 0.478271484375, 0.51708984375, 0.555908203125, 0.5947265625, 0.633544921875, 0.67236328125, 0.711181640625, 0.75, 0.788818359375, 0.82763671875, 0.866455078125, 0.9052734375, 0.944091796875, 0.98291015625, 1.021728515625, 1.060546875, 1.099365234375, 1.13818359375, 1.177001953125, 1.2158203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 10.0, 9.0, 10.0, 14.0, 14.0, 14.0, 14.0, 18.0, 22.0, 18.0, 30.0, 34.0, 36.0, 42.0, 36.0, 39.0, 80.0, 170.0, 336.0, 1387.0, 185.0, 90.0, 57.0, 50.0, 36.0, 36.0, 35.0, 21.0, 31.0, 18.0, 26.0, 24.0, 13.0, 13.0, 13.0, 15.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.84765625, -5.6761474609375, -5.504638671875, -5.3331298828125, -5.16162109375, -4.9901123046875, -4.818603515625, -4.6470947265625, -4.4755859375, -4.3040771484375, -4.132568359375, -3.9610595703125, -3.78955078125, -3.6180419921875, -3.446533203125, -3.2750244140625, -3.103515625, -2.9320068359375, -2.760498046875, -2.5889892578125, -2.41748046875, -2.2459716796875, -2.074462890625, -1.9029541015625, -1.7314453125, -1.5599365234375, -1.388427734375, -1.2169189453125, -1.04541015625, -0.8739013671875, -0.702392578125, -0.5308837890625, -0.359375, -0.1878662109375, -0.016357421875, 0.1551513671875, 0.32666015625, 0.4981689453125, 0.669677734375, 0.8411865234375, 1.0126953125, 1.1842041015625, 1.355712890625, 1.5272216796875, 1.69873046875, 1.8702392578125, 2.041748046875, 2.2132568359375, 2.384765625, 2.5562744140625, 2.727783203125, 2.8992919921875, 3.07080078125, 3.2423095703125, 3.413818359375, 3.5853271484375, 3.7568359375, 3.9283447265625, 4.099853515625, 4.2713623046875, 4.44287109375, 4.6143798828125, 4.785888671875, 4.9573974609375, 5.12890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 14.0, 15.0, 11.0, 17.0, 19.0, 24.0, 30.0, 47.0, 62.0, 72.0, 94.0, 123.0, 225.0, 454.0, 1225.0, 8544.0, 469153.0, 2633216.0, 28648.0, 2122.0, 631.0, 267.0, 187.0, 118.0, 87.0, 62.0, 38.0, 32.0, 33.0, 24.0, 23.0, 17.0, 14.0, 12.0, 5.0, 6.0, 4.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1778564453125, -8.863525390625, -8.5491943359375, -8.23486328125, -7.9205322265625, -7.606201171875, -7.2918701171875, -6.9775390625, -6.6632080078125, -6.348876953125, -6.0345458984375, -5.72021484375, -5.4058837890625, -5.091552734375, -4.7772216796875, -4.462890625, -4.1485595703125, -3.834228515625, -3.5198974609375, -3.20556640625, -2.8912353515625, -2.576904296875, -2.2625732421875, -1.9482421875, -1.6339111328125, -1.319580078125, -1.0052490234375, -0.69091796875, -0.3765869140625, -0.062255859375, 0.2520751953125, 0.56640625, 0.8807373046875, 1.195068359375, 1.5093994140625, 1.82373046875, 2.1380615234375, 2.452392578125, 2.7667236328125, 3.0810546875, 3.3953857421875, 3.709716796875, 4.0240478515625, 4.33837890625, 4.6527099609375, 4.967041015625, 5.2813720703125, 5.595703125, 5.9100341796875, 6.224365234375, 6.5386962890625, 6.85302734375, 7.1673583984375, 7.481689453125, 7.7960205078125, 8.1103515625, 8.4246826171875, 8.739013671875, 9.0533447265625, 9.36767578125, 9.6820068359375, 9.996337890625, 10.3106689453125, 10.625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 125.0, 449.0, 360.0, 64.0, 9.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.02841186523438, -70.76129913330078, -69.49418640136719, -68.2270736694336, -66.95996856689453, -65.69285583496094, -64.42574310302734, -63.15863037109375, -61.891517639160156, -60.62440490722656, -59.357295989990234, -58.09018325805664, -56.82307052612305, -55.55595779418945, -54.288848876953125, -53.02173614501953, -51.75462341308594, -50.487510681152344, -49.220401763916016, -47.95328903198242, -46.68617630004883, -45.419063568115234, -44.151954650878906, -42.88484191894531, -41.617733001708984, -40.35062026977539, -39.08351135253906, -37.81639862060547, -36.549285888671875, -35.28217315673828, -34.01506423950195, -32.74795150756836, -31.4808349609375, -30.21372413635254, -28.946611404418945, -27.679500579833984, -26.41238784790039, -25.14527702331543, -23.87816619873047, -22.611053466796875, -21.343942642211914, -20.076831817626953, -18.80971908569336, -17.5426082611084, -16.275495529174805, -15.008384704589844, -13.741272926330566, -12.474161148071289, -11.207049369812012, -9.939937591552734, -8.672825813293457, -7.405714511871338, -6.1386027336120605, -4.871490955352783, -3.604379653930664, -2.3372678756713867, -1.0701560974121094, 0.19695556163787842, 1.4640672206878662, 2.7311787605285645, 3.998290538787842, 5.265402317047119, 6.532513618469238, 7.799625396728516, 9.066737174987793]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 4.0, 10.0, 6.0, 8.0, 8.0, 10.0, 12.0, 20.0, 26.0, 19.0, 32.0, 28.0, 35.0, 27.0, 38.0, 35.0, 33.0, 58.0, 57.0, 48.0, 55.0, 53.0, 52.0, 45.0, 36.0, 49.0, 28.0, 30.0, 19.0, 25.0, 20.0, 16.0, 5.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34966278076172, -22.683855056762695, -22.018049240112305, -21.35224151611328, -20.68643569946289, -20.020627975463867, -19.354822158813477, -18.689014434814453, -18.023208618164062, -17.35740089416504, -16.69159507751465, -16.025787353515625, -15.359981536865234, -14.694174766540527, -14.02836799621582, -13.362560272216797, -12.69675350189209, -12.030946731567383, -11.365139961242676, -10.699333190917969, -10.033526420593262, -9.367719650268555, -8.701911926269531, -8.03610610961914, -7.370298862457275, -6.704492092132568, -6.038685321807861, -5.372878074645996, -4.707071304321289, -4.041264533996582, -3.375457763671875, -2.709650993347168, -2.043844223022461, -1.378037452697754, -0.7122305631637573, -0.04642367362976074, 0.6193830966949463, 1.2851898670196533, 1.9509968757629395, 2.6168036460876465, 3.2826104164123535, 3.9484171867370605, 4.614223957061768, 5.280031204223633, 5.94583797454834, 6.611644744873047, 7.277451515197754, 7.943258285522461, 8.609065055847168, 9.274871826171875, 9.940678596496582, 10.606485366821289, 11.272292137145996, 11.938098907470703, 12.603906631469727, 13.269712448120117, 13.93552017211914, 14.601326942443848, 15.267133712768555, 15.932940483093262, 16.59874725341797, 17.264554977416992, 17.930360794067383, 18.596168518066406, 19.261974334716797]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 6.0, 10.0, 5.0, 9.0, 6.0, 10.0, 17.0, 16.0, 17.0, 11.0, 19.0, 23.0, 23.0, 23.0, 32.0, 33.0, 33.0, 38.0, 38.0, 51.0, 44.0, 44.0, 42.0, 37.0, 31.0, 43.0, 32.0, 23.0, 44.0, 30.0, 26.0, 30.0, 27.0, 17.0, 19.0, 19.0, 14.0, 13.0, 10.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8212890625, -1.768798828125, -1.71630859375, -1.663818359375, -1.611328125, -1.558837890625, -1.50634765625, -1.453857421875, -1.4013671875, -1.348876953125, -1.29638671875, -1.243896484375, -1.19140625, -1.138916015625, -1.08642578125, -1.033935546875, -0.9814453125, -0.928955078125, -0.87646484375, -0.823974609375, -0.771484375, -0.718994140625, -0.66650390625, -0.614013671875, -0.5615234375, -0.509033203125, -0.45654296875, -0.404052734375, -0.3515625, -0.299072265625, -0.24658203125, -0.194091796875, -0.1416015625, -0.089111328125, -0.03662109375, 0.015869140625, 0.068359375, 0.120849609375, 0.17333984375, 0.225830078125, 0.2783203125, 0.330810546875, 0.38330078125, 0.435791015625, 0.48828125, 0.540771484375, 0.59326171875, 0.645751953125, 0.6982421875, 0.750732421875, 0.80322265625, 0.855712890625, 0.908203125, 0.960693359375, 1.01318359375, 1.065673828125, 1.1181640625, 1.170654296875, 1.22314453125, 1.275634765625, 1.328125, 1.380615234375, 1.43310546875, 1.485595703125, 1.5380859375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 8.0, 5.0, 4.0, 9.0, 4.0, 6.0, 9.0, 14.0, 13.0, 14.0, 16.0, 30.0, 29.0, 32.0, 54.0, 89.0, 113.0, 172.0, 373.0, 990.0, 3548.0, 18383.0, 149730.0, 1502618.0, 2180789.0, 298345.0, 30909.0, 5402.0, 1369.0, 509.0, 225.0, 136.0, 80.0, 51.0, 47.0, 36.0, 34.0, 18.0, 18.0, 13.0, 7.0, 10.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.609375, -4.47027587890625, -4.3311767578125, -4.19207763671875, -4.052978515625, -3.91387939453125, -3.7747802734375, -3.63568115234375, -3.49658203125, -3.35748291015625, -3.2183837890625, -3.07928466796875, -2.940185546875, -2.80108642578125, -2.6619873046875, -2.52288818359375, -2.3837890625, -2.24468994140625, -2.1055908203125, -1.96649169921875, -1.827392578125, -1.68829345703125, -1.5491943359375, -1.41009521484375, -1.27099609375, -1.13189697265625, -0.9927978515625, -0.85369873046875, -0.714599609375, -0.57550048828125, -0.4364013671875, -0.29730224609375, -0.158203125, -0.01910400390625, 0.1199951171875, 0.25909423828125, 0.398193359375, 0.53729248046875, 0.6763916015625, 0.81549072265625, 0.95458984375, 1.09368896484375, 1.2327880859375, 1.37188720703125, 1.510986328125, 1.65008544921875, 1.7891845703125, 1.92828369140625, 2.0673828125, 2.20648193359375, 2.3455810546875, 2.48468017578125, 2.623779296875, 2.76287841796875, 2.9019775390625, 3.04107666015625, 3.18017578125, 3.31927490234375, 3.4583740234375, 3.59747314453125, 3.736572265625, 3.87567138671875, 4.0147705078125, 4.15386962890625, 4.29296875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 6.0, 6.0, 14.0, 14.0, 25.0, 41.0, 50.0, 56.0, 80.0, 119.0, 185.0, 248.0, 312.0, 425.0, 491.0, 475.0, 375.0, 308.0, 236.0, 184.0, 126.0, 91.0, 57.0, 46.0, 22.0, 28.0, 14.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.9266357421875, -4.767333984375, -4.6080322265625, -4.44873046875, -4.2894287109375, -4.130126953125, -3.9708251953125, -3.8115234375, -3.6522216796875, -3.492919921875, -3.3336181640625, -3.17431640625, -3.0150146484375, -2.855712890625, -2.6964111328125, -2.537109375, -2.3778076171875, -2.218505859375, -2.0592041015625, -1.89990234375, -1.7406005859375, -1.581298828125, -1.4219970703125, -1.2626953125, -1.1033935546875, -0.944091796875, -0.7847900390625, -0.62548828125, -0.4661865234375, -0.306884765625, -0.1475830078125, 0.01171875, 0.1710205078125, 0.330322265625, 0.4896240234375, 0.64892578125, 0.8082275390625, 0.967529296875, 1.1268310546875, 1.2861328125, 1.4454345703125, 1.604736328125, 1.7640380859375, 1.92333984375, 2.0826416015625, 2.241943359375, 2.4012451171875, 2.560546875, 2.7198486328125, 2.879150390625, 3.0384521484375, 3.19775390625, 3.3570556640625, 3.516357421875, 3.6756591796875, 3.8349609375, 3.9942626953125, 4.153564453125, 4.3128662109375, 4.47216796875, 4.6314697265625, 4.790771484375, 4.9500732421875, 5.109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 12.0, 8.0, 17.0, 18.0, 40.0, 54.0, 102.0, 120.0, 215.0, 416.0, 1050.0, 4953.0, 71356.0, 2616572.0, 1456444.0, 37808.0, 3313.0, 861.0, 341.0, 188.0, 123.0, 84.0, 46.0, 42.0, 30.0, 20.0, 10.0, 7.0, 7.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.8238525390625, -9.444580078125, -9.0653076171875, -8.68603515625, -8.3067626953125, -7.927490234375, -7.5482177734375, -7.1689453125, -6.7896728515625, -6.410400390625, -6.0311279296875, -5.65185546875, -5.2725830078125, -4.893310546875, -4.5140380859375, -4.134765625, -3.7554931640625, -3.376220703125, -2.9969482421875, -2.61767578125, -2.2384033203125, -1.859130859375, -1.4798583984375, -1.1005859375, -0.7213134765625, -0.342041015625, 0.0372314453125, 0.41650390625, 0.7957763671875, 1.175048828125, 1.5543212890625, 1.93359375, 2.3128662109375, 2.692138671875, 3.0714111328125, 3.45068359375, 3.8299560546875, 4.209228515625, 4.5885009765625, 4.9677734375, 5.3470458984375, 5.726318359375, 6.1055908203125, 6.48486328125, 6.8641357421875, 7.243408203125, 7.6226806640625, 8.001953125, 8.3812255859375, 8.760498046875, 9.1397705078125, 9.51904296875, 9.8983154296875, 10.277587890625, 10.6568603515625, 11.0361328125, 11.4154052734375, 11.794677734375, 12.1739501953125, 12.55322265625, 12.9324951171875, 13.311767578125, 13.6910400390625, 14.0703125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 26.0, 33.0, 78.0, 105.0, 153.0, 168.0, 138.0, 125.0, 86.0, 51.0, 23.0, 11.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.65777587890625, -12.658008575439453, -11.658241271972656, -10.65847396850586, -9.658706665039062, -8.658939361572266, -7.659172534942627, -6.65940523147583, -5.659637928009033, -4.659870624542236, -3.6601033210754395, -2.6603362560272217, -1.6605689525604248, -0.660801887512207, 0.33896541595458984, 1.3387327194213867, 2.3385000228881836, 3.3382673263549805, 4.338034629821777, 5.337801933288574, 6.337569236755371, 7.33733606338501, 8.337102890014648, 9.336870193481445, 10.336637496948242, 11.336404800415039, 12.336172103881836, 13.335939407348633, 14.33570671081543, 15.335474014282227, 16.335241317749023, 17.33500862121582, 18.334775924682617, 19.334543228149414, 20.33431053161621, 21.334077835083008, 22.333845138549805, 23.3336124420166, 24.3333797454834, 25.333147048950195, 26.332914352416992, 27.33268165588379, 28.332448959350586, 29.332216262817383, 30.33198356628418, 31.331750869750977, 32.33151626586914, 33.33128356933594, 34.331050872802734, 35.33081817626953, 36.33058547973633, 37.330352783203125, 38.33012008666992, 39.32988739013672, 40.329654693603516, 41.32942199707031, 42.32918930053711, 43.328956604003906, 44.3287239074707, 45.3284912109375, 46.3282585144043, 47.328025817871094, 48.32779312133789, 49.32756042480469, 50.327327728271484]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 8.0, 4.0, 5.0, 4.0, 4.0, 13.0, 7.0, 20.0, 14.0, 15.0, 18.0, 26.0, 23.0, 26.0, 30.0, 35.0, 34.0, 40.0, 42.0, 46.0, 40.0, 46.0, 42.0, 47.0, 45.0, 41.0, 36.0, 32.0, 31.0, 31.0, 28.0, 25.0, 25.0, 32.0, 17.0, 10.0, 10.0, 9.0, 14.0, 6.0, 8.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.956981658935547, -13.46343994140625, -12.969898223876953, -12.476357460021973, -11.982815742492676, -11.489274024963379, -10.995733261108398, -10.502191543579102, -10.008649826049805, -9.515108108520508, -9.021566390991211, -8.52802562713623, -8.034483909606934, -7.540942192077637, -7.047400951385498, -6.553859710693359, -6.0603179931640625, -5.566776275634766, -5.073235034942627, -4.579693794250488, -4.086152076721191, -3.5926105976104736, -3.099069118499756, -2.605527639389038, -2.1119861602783203, -1.6184446811676025, -1.1249032020568848, -0.631361722946167, -0.13782024383544922, 0.35572123527526855, 0.8492627143859863, 1.342804193496704, 1.8363456726074219, 2.3298871517181396, 2.8234286308288574, 3.316970109939575, 3.810511589050293, 4.30405330657959, 4.7975945472717285, 5.291135787963867, 5.784677505493164, 6.278219223022461, 6.7717604637146, 7.265301704406738, 7.758843421936035, 8.252385139465332, 8.745925903320312, 9.23946762084961, 9.733009338378906, 10.226551055908203, 10.7200927734375, 11.21363353729248, 11.707175254821777, 12.200716972351074, 12.694257736206055, 13.187799453735352, 13.681341171264648, 14.174882888793945, 14.668424606323242, 15.161965370178223, 15.65550708770752, 16.1490478515625, 16.642589569091797, 17.136131286621094, 17.62967300415039]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 12.0, 11.0, 15.0, 10.0, 22.0, 13.0, 15.0, 15.0, 26.0, 23.0, 21.0, 32.0, 35.0, 34.0, 38.0, 45.0, 42.0, 46.0, 44.0, 49.0, 42.0, 34.0, 39.0, 31.0, 25.0, 34.0, 27.0, 27.0, 17.0, 23.0, 19.0, 18.0, 18.0, 14.0, 11.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5201416015625, -1.468017578125, -1.4158935546875, -1.36376953125, -1.3116455078125, -1.259521484375, -1.2073974609375, -1.1552734375, -1.1031494140625, -1.051025390625, -0.9989013671875, -0.94677734375, -0.8946533203125, -0.842529296875, -0.7904052734375, -0.73828125, -0.6861572265625, -0.634033203125, -0.5819091796875, -0.52978515625, -0.4776611328125, -0.425537109375, -0.3734130859375, -0.3212890625, -0.2691650390625, -0.217041015625, -0.1649169921875, -0.11279296875, -0.0606689453125, -0.008544921875, 0.0435791015625, 0.095703125, 0.1478271484375, 0.199951171875, 0.2520751953125, 0.30419921875, 0.3563232421875, 0.408447265625, 0.4605712890625, 0.5126953125, 0.5648193359375, 0.616943359375, 0.6690673828125, 0.72119140625, 0.7733154296875, 0.825439453125, 0.8775634765625, 0.9296875, 0.9818115234375, 1.033935546875, 1.0860595703125, 1.13818359375, 1.1903076171875, 1.242431640625, 1.2945556640625, 1.3466796875, 1.3988037109375, 1.450927734375, 1.5030517578125, 1.55517578125, 1.6072998046875, 1.659423828125, 1.7115478515625, 1.763671875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 8.0, 13.0, 12.0, 15.0, 26.0, 40.0, 68.0, 106.0, 124.0, 193.0, 326.0, 435.0, 618.0, 834.0, 1183.0, 1702.0, 2553.0, 3679.0, 5353.0, 7847.0, 11582.0, 17610.0, 26781.0, 41993.0, 68393.0, 123064.0, 260443.0, 204910.0, 101747.0, 58728.0, 36425.0, 23472.0, 15467.0, 10435.0, 6842.0, 4816.0, 3306.0, 2267.0, 1573.0, 1078.0, 729.0, 540.0, 379.0, 273.0, 192.0, 120.0, 88.0, 58.0, 42.0, 30.0, 17.0, 14.0, 9.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29724884033203125, -0.2876129150390625, -0.27797698974609375, -0.268341064453125, -0.25870513916015625, -0.2490692138671875, -0.23943328857421875, -0.22979736328125, -0.22016143798828125, -0.2105255126953125, -0.20088958740234375, -0.191253662109375, -0.18161773681640625, -0.1719818115234375, -0.16234588623046875, -0.1527099609375, -0.14307403564453125, -0.1334381103515625, -0.12380218505859375, -0.114166259765625, -0.10453033447265625, -0.0948944091796875, -0.08525848388671875, -0.07562255859375, -0.06598663330078125, -0.0563507080078125, -0.04671478271484375, -0.037078857421875, -0.02744293212890625, -0.0178070068359375, -0.00817108154296875, 0.00146484375, 0.01110076904296875, 0.0207366943359375, 0.03037261962890625, 0.040008544921875, 0.04964447021484375, 0.0592803955078125, 0.06891632080078125, 0.07855224609375, 0.08818817138671875, 0.0978240966796875, 0.10746002197265625, 0.117095947265625, 0.12673187255859375, 0.1363677978515625, 0.14600372314453125, 0.1556396484375, 0.16527557373046875, 0.1749114990234375, 0.18454742431640625, 0.194183349609375, 0.20381927490234375, 0.2134552001953125, 0.22309112548828125, 0.23272705078125, 0.24236297607421875, 0.2519989013671875, 0.26163482666015625, 0.271270751953125, 0.28090667724609375, 0.2905426025390625, 0.30017852783203125, 0.309814453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 12.0, 10.0, 12.0, 14.0, 16.0, 7.0, 16.0, 24.0, 21.0, 36.0, 28.0, 28.0, 26.0, 36.0, 24.0, 29.0, 29.0, 35.0, 30.0, 1053.0, 41.0, 34.0, 34.0, 34.0, 33.0, 32.0, 17.0, 33.0, 32.0, 25.0, 29.0, 24.0, 11.0, 33.0, 19.0, 18.0, 12.0, 11.0, 11.0, 7.0, 9.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.9716796875, -0.9411544799804688, -0.9106292724609375, -0.8801040649414062, -0.849578857421875, -0.8190536499023438, -0.7885284423828125, -0.7580032348632812, -0.72747802734375, -0.6969528198242188, -0.6664276123046875, -0.6359024047851562, -0.605377197265625, -0.5748519897460938, -0.5443267822265625, -0.5138015747070312, -0.4832763671875, -0.45275115966796875, -0.4222259521484375, -0.39170074462890625, -0.361175537109375, -0.33065032958984375, -0.3001251220703125, -0.26959991455078125, -0.23907470703125, -0.20854949951171875, -0.1780242919921875, -0.14749908447265625, -0.116973876953125, -0.08644866943359375, -0.0559234619140625, -0.02539825439453125, 0.005126953125, 0.03565216064453125, 0.0661773681640625, 0.09670257568359375, 0.127227783203125, 0.15775299072265625, 0.1882781982421875, 0.21880340576171875, 0.24932861328125, 0.27985382080078125, 0.3103790283203125, 0.34090423583984375, 0.371429443359375, 0.40195465087890625, 0.4324798583984375, 0.46300506591796875, 0.4935302734375, 0.5240554809570312, 0.5545806884765625, 0.5851058959960938, 0.615631103515625, 0.6461563110351562, 0.6766815185546875, 0.7072067260742188, 0.73773193359375, 0.7682571411132812, 0.7987823486328125, 0.8293075561523438, 0.859832763671875, 0.8903579711914062, 0.9208831787109375, 0.9514083862304688, 0.98193359375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 11.0, 12.0, 13.0, 33.0, 53.0, 69.0, 100.0, 154.0, 242.0, 337.0, 497.0, 675.0, 1068.0, 1527.0, 2198.0, 3210.0, 4756.0, 6877.0, 10084.0, 15034.0, 22642.0, 34203.0, 54086.0, 88535.0, 159527.0, 1307727.0, 149491.0, 83884.0, 51114.0, 32801.0, 21511.0, 14145.0, 9527.0, 6458.0, 4467.0, 3145.0, 2153.0, 1540.0, 1057.0, 714.0, 502.0, 318.0, 229.0, 125.0, 98.0, 63.0, 55.0, 21.0, 16.0, 13.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2646484375, -0.25623321533203125, -0.2478179931640625, -0.23940277099609375, -0.230987548828125, -0.22257232666015625, -0.2141571044921875, -0.20574188232421875, -0.19732666015625, -0.18891143798828125, -0.1804962158203125, -0.17208099365234375, -0.163665771484375, -0.15525054931640625, -0.1468353271484375, -0.13842010498046875, -0.1300048828125, -0.12158966064453125, -0.1131744384765625, -0.10475921630859375, -0.096343994140625, -0.08792877197265625, -0.0795135498046875, -0.07109832763671875, -0.06268310546875, -0.05426788330078125, -0.0458526611328125, -0.03743743896484375, -0.029022216796875, -0.02060699462890625, -0.0121917724609375, -0.00377655029296875, 0.004638671875, 0.01305389404296875, 0.0214691162109375, 0.02988433837890625, 0.038299560546875, 0.04671478271484375, 0.0551300048828125, 0.06354522705078125, 0.07196044921875, 0.08037567138671875, 0.0887908935546875, 0.09720611572265625, 0.105621337890625, 0.11403656005859375, 0.1224517822265625, 0.13086700439453125, 0.1392822265625, 0.14769744873046875, 0.1561126708984375, 0.16452789306640625, 0.172943115234375, 0.18135833740234375, 0.1897735595703125, 0.19818878173828125, 0.20660400390625, 0.21501922607421875, 0.2234344482421875, 0.23184967041015625, 0.240264892578125, 0.24868011474609375, 0.2570953369140625, 0.26551055908203125, 0.27392578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 2.0, 8.0, 4.0, 11.0, 8.0, 10.0, 7.0, 10.0, 16.0, 17.0, 17.0, 17.0, 28.0, 44.0, 53.0, 45.0, 41.0, 64.0, 60.0, 59.0, 67.0, 48.0, 55.0, 36.0, 44.0, 43.0, 33.0, 23.0, 29.0, 19.0, 17.0, 13.0, 3.0, 5.0, 5.0, 9.0, 6.0, 8.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.00022685527801513672, -0.000220518559217453, -0.0002141818404197693, -0.00020784512162208557, -0.00020150840282440186, -0.00019517168402671814, -0.00018883496522903442, -0.0001824982464313507, -0.000176161527633667, -0.00016982480883598328, -0.00016348809003829956, -0.00015715137124061584, -0.00015081465244293213, -0.0001444779336452484, -0.0001381412148475647, -0.00013180449604988098, -0.00012546777725219727, -0.00011913105845451355, -0.00011279433965682983, -0.00010645762085914612, -0.0001001209020614624, -9.378418326377869e-05, -8.744746446609497e-05, -8.111074566841125e-05, -7.477402687072754e-05, -6.843730807304382e-05, -6.210058927536011e-05, -5.576387047767639e-05, -4.9427151679992676e-05, -4.309043288230896e-05, -3.6753714084625244e-05, -3.041699528694153e-05, -2.4080276489257812e-05, -1.7743557691574097e-05, -1.1406838893890381e-05, -5.070120096206665e-06, 1.2665987014770508e-06, 7.603317499160767e-06, 1.3940036296844482e-05, 2.0276755094528198e-05, 2.6613473892211914e-05, 3.295019268989563e-05, 3.9286911487579346e-05, 4.562363028526306e-05, 5.196034908294678e-05, 5.829706788063049e-05, 6.463378667831421e-05, 7.097050547599792e-05, 7.730722427368164e-05, 8.364394307136536e-05, 8.998066186904907e-05, 9.631738066673279e-05, 0.0001026540994644165, 0.00010899081826210022, 0.00011532753705978394, 0.00012166425585746765, 0.00012800097465515137, 0.00013433769345283508, 0.0001406744122505188, 0.00014701113104820251, 0.00015334784984588623, 0.00015968456864356995, 0.00016602128744125366, 0.00017235800623893738, 0.0001786947250366211]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 13.0, 11.0, 19.0, 25.0, 31.0, 40.0, 55.0, 56.0, 81.0, 83.0, 115.0, 187.0, 223.0, 356.0, 491.0, 1668.0, 133911.0, 899980.0, 8834.0, 794.0, 425.0, 295.0, 189.0, 144.0, 108.0, 67.0, 47.0, 58.0, 40.0, 26.0, 22.0, 24.0, 24.0, 19.0, 15.0, 16.0, 6.0, 9.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00284576416015625, -0.00274503231048584, -0.0026443004608154297, -0.0025435686111450195, -0.0024428367614746094, -0.0023421049118041992, -0.002241373062133789, -0.002140641212463379, -0.0020399093627929688, -0.0019391775131225586, -0.0018384456634521484, -0.0017377138137817383, -0.0016369819641113281, -0.001536250114440918, -0.0014355182647705078, -0.0013347864151000977, -0.0012340545654296875, -0.0011333227157592773, -0.0010325908660888672, -0.000931859016418457, -0.0008311271667480469, -0.0007303953170776367, -0.0006296634674072266, -0.0005289316177368164, -0.00042819976806640625, -0.0003274679183959961, -0.00022673606872558594, -0.00012600421905517578, -2.5272369384765625e-05, 7.545948028564453e-05, 0.0001761913299560547, 0.00027692317962646484, 0.000377655029296875, 0.00047838687896728516, 0.0005791187286376953, 0.0006798505783081055, 0.0007805824279785156, 0.0008813142776489258, 0.000982046127319336, 0.001082777976989746, 0.0011835098266601562, 0.0012842416763305664, 0.0013849735260009766, 0.0014857053756713867, 0.0015864372253417969, 0.001687169075012207, 0.0017879009246826172, 0.0018886327743530273, 0.0019893646240234375, 0.0020900964736938477, 0.002190828323364258, 0.002291560173034668, 0.002392292022705078, 0.0024930238723754883, 0.0025937557220458984, 0.0026944875717163086, 0.0027952194213867188, 0.002895951271057129, 0.002996683120727539, 0.0030974149703979492, 0.0031981468200683594, 0.0032988786697387695, 0.0033996105194091797, 0.00350034236907959, 0.00360107421875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 17.0, 39.0, 84.0, 172.0, 225.0, 210.0, 136.0, 67.0, 37.0, 14.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040207267738878727, -0.00039331018342636526, -0.0003845477185677737, -0.0003757852246053517, -0.0003670227306429297, -0.00035826023668050766, -0.0003494977718219161, -0.0003407352778594941, -0.0003319727838970721, -0.00032321028993465006, -0.0003144478250760585, -0.0003056853311136365, -0.0002969228371512145, -0.00028816034318879247, -0.0002793978783302009, -0.0002706353843677789, -0.0002618728904053569, -0.00025311039644293487, -0.0002443479315843433, -0.0002355854376219213, -0.0002268229436594993, -0.0002180604642489925, -0.00020929798483848572, -0.0002005354908760637, -0.00019177302601747215, -0.00018301054660696536, -0.00017424805264454335, -0.00016548557323403656, -0.00015672307927161455, -0.00014796059986110777, -0.00013919812045060098, -0.00013043562648817897, -0.00012167311797384173, -0.00011291063128737733, -0.00010414814460091293, -9.538566519040614e-05, -8.662317122798413e-05, -7.786069181747735e-05, -6.909820513101295e-05, -6.033571844454855e-05, -5.157323175808415e-05, -4.281074507161975e-05, -3.404825838515535e-05, -2.5285775336669758e-05, -1.652328865020536e-05, -7.76080196374096e-06, 1.0016810847446322e-06, 9.764167771209031e-06, 1.852665445767343e-05, 2.728914114413783e-05, 3.605162783060223e-05, 4.481411087908782e-05, 5.357659756555222e-05, 6.233908061403781e-05, 7.110156730050221e-05, 7.986405398696661e-05, 8.862654067343101e-05, 9.738902735989541e-05, 0.00010615151404635981, 0.0001149140007328242, 0.000123676480143331, 0.000132438974105753, 0.0001412014535162598, 0.0001499639474786818, 0.0001587264268891886]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 15.0, 13.0, 13.0, 20.0, 22.0, 15.0, 26.0, 33.0, 24.0, 28.0, 55.0, 35.0, 35.0, 37.0, 43.0, 42.0, 29.0, 35.0, 27.0, 41.0, 37.0, 32.0, 33.0, 21.0, 35.0, 35.0, 22.0, 24.0, 31.0, 16.0, 20.0, 16.0, 13.0, 12.0, 6.0, 2.0, 7.0, 3.0, 9.0, 1.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00010120868682861328, -9.79127362370491e-05, -9.461678564548492e-05, -9.132083505392075e-05, -8.802488446235657e-05, -8.472893387079239e-05, -8.143298327922821e-05, -7.813703268766403e-05, -7.484108209609985e-05, -7.154513150453568e-05, -6.82491809129715e-05, -6.495323032140732e-05, -6.165727972984314e-05, -5.836132913827896e-05, -5.506537854671478e-05, -5.1769427955150604e-05, -4.8473477363586426e-05, -4.517752677202225e-05, -4.188157618045807e-05, -3.858562558889389e-05, -3.528967499732971e-05, -3.1993724405765533e-05, -2.8697773814201355e-05, -2.5401823222637177e-05, -2.2105872631072998e-05, -1.880992203950882e-05, -1.551397144794464e-05, -1.2218020856380463e-05, -8.922070264816284e-06, -5.626119673252106e-06, -2.3301690816879272e-06, 9.657815098762512e-07, 4.26173210144043e-06, 7.557682693004608e-06, 1.0853633284568787e-05, 1.4149583876132965e-05, 1.7445534467697144e-05, 2.0741485059261322e-05, 2.40374356508255e-05, 2.733338624238968e-05, 3.062933683395386e-05, 3.3925287425518036e-05, 3.7221238017082214e-05, 4.051718860864639e-05, 4.381313920021057e-05, 4.710908979177475e-05, 5.040504038333893e-05, 5.370099097490311e-05, 5.6996941566467285e-05, 6.0292892158031464e-05, 6.358884274959564e-05, 6.688479334115982e-05, 7.0180743932724e-05, 7.347669452428818e-05, 7.677264511585236e-05, 8.006859570741653e-05, 8.336454629898071e-05, 8.666049689054489e-05, 8.995644748210907e-05, 9.325239807367325e-05, 9.654834866523743e-05, 9.98442992568016e-05, 0.00010314024984836578, 0.00010643620043992996, 0.00010973215103149414]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 12.0, 11.0, 15.0, 10.0, 22.0, 13.0, 15.0, 15.0, 26.0, 23.0, 21.0, 32.0, 35.0, 34.0, 38.0, 45.0, 42.0, 46.0, 44.0, 49.0, 42.0, 34.0, 39.0, 31.0, 25.0, 34.0, 27.0, 27.0, 17.0, 23.0, 19.0, 18.0, 18.0, 14.0, 11.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5201416015625, -1.468017578125, -1.4158935546875, -1.36376953125, -1.3116455078125, -1.259521484375, -1.2073974609375, -1.1552734375, -1.1031494140625, -1.051025390625, -0.9989013671875, -0.94677734375, -0.8946533203125, -0.842529296875, -0.7904052734375, -0.73828125, -0.6861572265625, -0.634033203125, -0.5819091796875, -0.52978515625, -0.4776611328125, -0.425537109375, -0.3734130859375, -0.3212890625, -0.2691650390625, -0.217041015625, -0.1649169921875, -0.11279296875, -0.0606689453125, -0.008544921875, 0.0435791015625, 0.095703125, 0.1478271484375, 0.199951171875, 0.2520751953125, 0.30419921875, 0.3563232421875, 0.408447265625, 0.4605712890625, 0.5126953125, 0.5648193359375, 0.616943359375, 0.6690673828125, 0.72119140625, 0.7733154296875, 0.825439453125, 0.8775634765625, 0.9296875, 0.9818115234375, 1.033935546875, 1.0860595703125, 1.13818359375, 1.1903076171875, 1.242431640625, 1.2945556640625, 1.3466796875, 1.3988037109375, 1.450927734375, 1.5030517578125, 1.55517578125, 1.6072998046875, 1.659423828125, 1.7115478515625, 1.763671875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 12.0, 10.0, 14.0, 17.0, 26.0, 29.0, 49.0, 60.0, 90.0, 123.0, 178.0, 277.0, 388.0, 587.0, 981.0, 1692.0, 2917.0, 5442.0, 10368.0, 22412.0, 56867.0, 184221.0, 455573.0, 197669.0, 60898.0, 23707.0, 10616.0, 5503.0, 3035.0, 1821.0, 1071.0, 624.0, 402.0, 263.0, 174.0, 121.0, 98.0, 59.0, 45.0, 30.0, 25.0, 15.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.251953125, -2.175689697265625, -2.09942626953125, -2.023162841796875, -1.9468994140625, -1.870635986328125, -1.79437255859375, -1.718109130859375, -1.641845703125, -1.565582275390625, -1.48931884765625, -1.413055419921875, -1.3367919921875, -1.260528564453125, -1.18426513671875, -1.108001708984375, -1.03173828125, -0.955474853515625, -0.87921142578125, -0.802947998046875, -0.7266845703125, -0.650421142578125, -0.57415771484375, -0.497894287109375, -0.421630859375, -0.345367431640625, -0.26910400390625, -0.192840576171875, -0.1165771484375, -0.040313720703125, 0.03594970703125, 0.112213134765625, 0.1884765625, 0.264739990234375, 0.34100341796875, 0.417266845703125, 0.4935302734375, 0.569793701171875, 0.64605712890625, 0.722320556640625, 0.798583984375, 0.874847412109375, 0.95111083984375, 1.027374267578125, 1.1036376953125, 1.179901123046875, 1.25616455078125, 1.332427978515625, 1.40869140625, 1.484954833984375, 1.56121826171875, 1.637481689453125, 1.7137451171875, 1.790008544921875, 1.86627197265625, 1.942535400390625, 2.018798828125, 2.095062255859375, 2.17132568359375, 2.247589111328125, 2.3238525390625, 2.400115966796875, 2.47637939453125, 2.552642822265625, 2.62890625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 10.0, 15.0, 10.0, 12.0, 16.0, 14.0, 15.0, 14.0, 25.0, 20.0, 31.0, 42.0, 43.0, 44.0, 43.0, 73.0, 110.0, 182.0, 1392.0, 296.0, 129.0, 79.0, 54.0, 42.0, 47.0, 30.0, 30.0, 27.0, 20.0, 23.0, 21.0, 26.0, 25.0, 9.0, 15.0, 11.0, 5.0, 8.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.5743408203125, -5.386962890625, -5.1995849609375, -5.01220703125, -4.8248291015625, -4.637451171875, -4.4500732421875, -4.2626953125, -4.0753173828125, -3.887939453125, -3.7005615234375, -3.51318359375, -3.3258056640625, -3.138427734375, -2.9510498046875, -2.763671875, -2.5762939453125, -2.388916015625, -2.2015380859375, -2.01416015625, -1.8267822265625, -1.639404296875, -1.4520263671875, -1.2646484375, -1.0772705078125, -0.889892578125, -0.7025146484375, -0.51513671875, -0.3277587890625, -0.140380859375, 0.0469970703125, 0.234375, 0.4217529296875, 0.609130859375, 0.7965087890625, 0.98388671875, 1.1712646484375, 1.358642578125, 1.5460205078125, 1.7333984375, 1.9207763671875, 2.108154296875, 2.2955322265625, 2.48291015625, 2.6702880859375, 2.857666015625, 3.0450439453125, 3.232421875, 3.4197998046875, 3.607177734375, 3.7945556640625, 3.98193359375, 4.1693115234375, 4.356689453125, 4.5440673828125, 4.7314453125, 4.9188232421875, 5.106201171875, 5.2935791015625, 5.48095703125, 5.6683349609375, 5.855712890625, 6.0430908203125, 6.23046875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 2.0, 7.0, 11.0, 21.0, 38.0, 39.0, 73.0, 117.0, 181.0, 374.0, 1246.0, 36173.0, 3093095.0, 12571.0, 943.0, 320.0, 165.0, 98.0, 66.0, 48.0, 34.0, 20.0, 22.0, 15.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.5625, -25.790283203125, -25.01806640625, -24.245849609375, -23.4736328125, -22.701416015625, -21.92919921875, -21.156982421875, -20.384765625, -19.612548828125, -18.84033203125, -18.068115234375, -17.2958984375, -16.523681640625, -15.75146484375, -14.979248046875, -14.20703125, -13.434814453125, -12.66259765625, -11.890380859375, -11.1181640625, -10.345947265625, -9.57373046875, -8.801513671875, -8.029296875, -7.257080078125, -6.48486328125, -5.712646484375, -4.9404296875, -4.168212890625, -3.39599609375, -2.623779296875, -1.8515625, -1.079345703125, -0.30712890625, 0.465087890625, 1.2373046875, 2.009521484375, 2.78173828125, 3.553955078125, 4.326171875, 5.098388671875, 5.87060546875, 6.642822265625, 7.4150390625, 8.187255859375, 8.95947265625, 9.731689453125, 10.50390625, 11.276123046875, 12.04833984375, 12.820556640625, 13.5927734375, 14.364990234375, 15.13720703125, 15.909423828125, 16.681640625, 17.453857421875, 18.22607421875, 18.998291015625, 19.7705078125, 20.542724609375, 21.31494140625, 22.087158203125, 22.859375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 144.0, 560.0, 282.0, 19.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-102.21324920654297, -100.40779113769531, -98.60233306884766, -96.796875, -94.99141693115234, -93.18595886230469, -91.38050079345703, -89.57504272460938, -87.76958465576172, -85.96412658691406, -84.1586685180664, -82.35321044921875, -80.5477523803711, -78.74229431152344, -76.93683624267578, -75.13137817382812, -73.32592010498047, -71.52046203613281, -69.71500396728516, -67.9095458984375, -66.10408782958984, -64.29862976074219, -62.49317169189453, -60.687713623046875, -58.882259368896484, -57.07680130004883, -55.27134323120117, -53.465885162353516, -51.66042709350586, -49.8549690246582, -48.04951095581055, -46.24405288696289, -44.43859100341797, -42.63313293457031, -40.827674865722656, -39.022216796875, -37.216758728027344, -35.41130065917969, -33.60584259033203, -31.800384521484375, -29.994930267333984, -28.189472198486328, -26.384014129638672, -24.578556060791016, -22.77309799194336, -20.967639923095703, -19.162181854248047, -17.35672378540039, -15.551265716552734, -13.745807647705078, -11.940349578857422, -10.134891510009766, -8.32943344116211, -6.5239763259887695, -4.718518257141113, -2.913060188293457, -1.1076021194458008, 0.6978558301925659, 2.5033137798309326, 4.30877161026001, 6.114229679107666, 7.919687271118164, 9.72514533996582, 11.530603408813477, 13.336061477661133]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 11.0, 10.0, 9.0, 8.0, 9.0, 15.0, 9.0, 10.0, 24.0, 15.0, 31.0, 19.0, 37.0, 16.0, 27.0, 30.0, 23.0, 31.0, 32.0, 32.0, 41.0, 32.0, 41.0, 44.0, 43.0, 36.0, 38.0, 25.0, 42.0, 27.0, 30.0, 26.0, 19.0, 21.0, 24.0, 18.0, 16.0, 19.0, 6.0, 9.0, 9.0, 7.0, 4.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.81233024597168, -17.27786636352539, -16.7434024810791, -16.208938598632812, -15.674473762512207, -15.140008926391602, -14.605545043945312, -14.071081161499023, -13.536617279052734, -13.002153396606445, -12.46768856048584, -11.93322467803955, -11.398760795593262, -10.864295959472656, -10.329832077026367, -9.795368194580078, -9.260903358459473, -8.726439476013184, -8.191974639892578, -7.657510757446289, -7.123046875, -6.588582515716553, -6.0541181564331055, -5.519654273986816, -4.985189914703369, -4.450725555419922, -3.916261672973633, -3.3817973136901855, -2.8473331928253174, -2.312869071960449, -1.778404712677002, -1.2439405918121338, -0.7094764709472656, -0.17501229047775269, 0.35945188999176025, 0.893916130065918, 1.4283802509307861, 1.9628443717956543, 2.4973087310791016, 3.0317728519439697, 3.566236972808838, 4.100701332092285, 4.635165214538574, 5.1696295738220215, 5.704093933105469, 6.238557815551758, 6.773022174835205, 7.307486534118652, 7.841950416564941, 8.37641429901123, 8.910879135131836, 9.445343017578125, 9.979806900024414, 10.514270782470703, 11.048735618591309, 11.583199501037598, 12.117664337158203, 12.652128219604492, 13.186593055725098, 13.721056938171387, 14.255520820617676, 14.789985656738281, 15.32444953918457, 15.85891342163086, 16.39337730407715]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 4.0, 6.0, 6.0, 6.0, 6.0, 9.0, 12.0, 13.0, 12.0, 13.0, 10.0, 16.0, 27.0, 29.0, 32.0, 22.0, 25.0, 28.0, 31.0, 40.0, 40.0, 35.0, 40.0, 40.0, 39.0, 35.0, 33.0, 33.0, 35.0, 46.0, 29.0, 24.0, 19.0, 31.0, 25.0, 23.0, 14.0, 17.0, 11.0, 13.0, 13.0, 14.0, 6.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.6435546875, -1.5915069580078125, -1.539459228515625, -1.4874114990234375, -1.43536376953125, -1.3833160400390625, -1.331268310546875, -1.2792205810546875, -1.2271728515625, -1.1751251220703125, -1.123077392578125, -1.0710296630859375, -1.01898193359375, -0.9669342041015625, -0.914886474609375, -0.8628387451171875, -0.810791015625, -0.7587432861328125, -0.706695556640625, -0.6546478271484375, -0.60260009765625, -0.5505523681640625, -0.498504638671875, -0.4464569091796875, -0.3944091796875, -0.3423614501953125, -0.290313720703125, -0.2382659912109375, -0.18621826171875, -0.1341705322265625, -0.082122802734375, -0.0300750732421875, 0.02197265625, 0.0740203857421875, 0.126068115234375, 0.1781158447265625, 0.23016357421875, 0.2822113037109375, 0.334259033203125, 0.3863067626953125, 0.4383544921875, 0.4904022216796875, 0.542449951171875, 0.5944976806640625, 0.64654541015625, 0.6985931396484375, 0.750640869140625, 0.8026885986328125, 0.854736328125, 0.9067840576171875, 0.958831787109375, 1.0108795166015625, 1.06292724609375, 1.1149749755859375, 1.167022705078125, 1.2190704345703125, 1.2711181640625, 1.3231658935546875, 1.375213623046875, 1.4272613525390625, 1.47930908203125, 1.5313568115234375, 1.583404541015625, 1.6354522705078125, 1.6875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 6.0, 17.0, 14.0, 17.0, 28.0, 36.0, 46.0, 74.0, 99.0, 139.0, 222.0, 333.0, 559.0, 1021.0, 2093.0, 4759.0, 11658.0, 32405.0, 101002.0, 333404.0, 909759.0, 1400407.0, 902799.0, 336663.0, 102817.0, 32302.0, 11773.0, 4868.0, 2208.0, 1127.0, 540.0, 329.0, 216.0, 149.0, 96.0, 84.0, 58.0, 30.0, 23.0, 24.0, 13.0, 15.0, 13.0, 3.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.27734375, -2.207275390625, -2.13720703125, -2.067138671875, -1.9970703125, -1.927001953125, -1.85693359375, -1.786865234375, -1.716796875, -1.646728515625, -1.57666015625, -1.506591796875, -1.4365234375, -1.366455078125, -1.29638671875, -1.226318359375, -1.15625, -1.086181640625, -1.01611328125, -0.946044921875, -0.8759765625, -0.805908203125, -0.73583984375, -0.665771484375, -0.595703125, -0.525634765625, -0.45556640625, -0.385498046875, -0.3154296875, -0.245361328125, -0.17529296875, -0.105224609375, -0.03515625, 0.034912109375, 0.10498046875, 0.175048828125, 0.2451171875, 0.315185546875, 0.38525390625, 0.455322265625, 0.525390625, 0.595458984375, 0.66552734375, 0.735595703125, 0.8056640625, 0.875732421875, 0.94580078125, 1.015869140625, 1.0859375, 1.156005859375, 1.22607421875, 1.296142578125, 1.3662109375, 1.436279296875, 1.50634765625, 1.576416015625, 1.646484375, 1.716552734375, 1.78662109375, 1.856689453125, 1.9267578125, 1.996826171875, 2.06689453125, 2.136962890625, 2.20703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 7.0, 10.0, 19.0, 25.0, 47.0, 45.0, 69.0, 98.0, 130.0, 170.0, 216.0, 263.0, 356.0, 395.0, 406.0, 337.0, 271.0, 259.0, 208.0, 188.0, 137.0, 94.0, 65.0, 49.0, 51.0, 30.0, 24.0, 24.0, 18.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.91400146484375, -3.7811279296875, -3.64825439453125, -3.515380859375, -3.38250732421875, -3.2496337890625, -3.11676025390625, -2.98388671875, -2.85101318359375, -2.7181396484375, -2.58526611328125, -2.452392578125, -2.31951904296875, -2.1866455078125, -2.05377197265625, -1.9208984375, -1.78802490234375, -1.6551513671875, -1.52227783203125, -1.389404296875, -1.25653076171875, -1.1236572265625, -0.99078369140625, -0.85791015625, -0.72503662109375, -0.5921630859375, -0.45928955078125, -0.326416015625, -0.19354248046875, -0.0606689453125, 0.07220458984375, 0.205078125, 0.33795166015625, 0.4708251953125, 0.60369873046875, 0.736572265625, 0.86944580078125, 1.0023193359375, 1.13519287109375, 1.26806640625, 1.40093994140625, 1.5338134765625, 1.66668701171875, 1.799560546875, 1.93243408203125, 2.0653076171875, 2.19818115234375, 2.3310546875, 2.46392822265625, 2.5968017578125, 2.72967529296875, 2.862548828125, 2.99542236328125, 3.1282958984375, 3.26116943359375, 3.39404296875, 3.52691650390625, 3.6597900390625, 3.79266357421875, 3.925537109375, 4.05841064453125, 4.1912841796875, 4.32415771484375, 4.45703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 11.0, 25.0, 25.0, 42.0, 48.0, 60.0, 67.0, 115.0, 218.0, 460.0, 1619.0, 12262.0, 310012.0, 3470945.0, 381343.0, 14146.0, 1695.0, 510.0, 221.0, 130.0, 96.0, 61.0, 41.0, 23.0, 19.0, 19.0, 18.0, 9.0, 12.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.10498046875, -10.7412109375, -10.37744140625, -10.013671875, -9.64990234375, -9.2861328125, -8.92236328125, -8.55859375, -8.19482421875, -7.8310546875, -7.46728515625, -7.103515625, -6.73974609375, -6.3759765625, -6.01220703125, -5.6484375, -5.28466796875, -4.9208984375, -4.55712890625, -4.193359375, -3.82958984375, -3.4658203125, -3.10205078125, -2.73828125, -2.37451171875, -2.0107421875, -1.64697265625, -1.283203125, -0.91943359375, -0.5556640625, -0.19189453125, 0.171875, 0.53564453125, 0.8994140625, 1.26318359375, 1.626953125, 1.99072265625, 2.3544921875, 2.71826171875, 3.08203125, 3.44580078125, 3.8095703125, 4.17333984375, 4.537109375, 4.90087890625, 5.2646484375, 5.62841796875, 5.9921875, 6.35595703125, 6.7197265625, 7.08349609375, 7.447265625, 7.81103515625, 8.1748046875, 8.53857421875, 8.90234375, 9.26611328125, 9.6298828125, 9.99365234375, 10.357421875, 10.72119140625, 11.0849609375, 11.44873046875, 11.8125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 22.0, 68.0, 182.0, 252.0, 216.0, 158.0, 75.0, 23.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.831392288208008, -13.320860862731934, -11.81032943725586, -10.299797058105469, -8.789265632629395, -7.27873420715332, -5.76820182800293, -4.2576704025268555, -2.7471389770507812, -1.236607313156128, 0.2739243507385254, 1.7844562530517578, 3.294987678527832, 4.805519104003906, 6.316051483154297, 7.826582908630371, 9.337114334106445, 10.84764575958252, 12.358177185058594, 13.868709564208984, 15.379240989685059, 16.889772415161133, 18.400304794311523, 19.91083526611328, 21.421367645263672, 22.931900024414062, 24.44243049621582, 25.95296287536621, 27.46349334716797, 28.97402572631836, 30.48455810546875, 31.99509048461914, 33.50562286376953, 35.01615524291992, 36.52668762207031, 38.03721618652344, 39.54774856567383, 41.05828094482422, 42.56881332397461, 44.079345703125, 45.589874267578125, 47.100406646728516, 48.610939025878906, 50.12146759033203, 51.63199996948242, 53.14253234863281, 54.6530647277832, 56.163597106933594, 57.674129486083984, 59.184661865234375, 60.695194244384766, 62.205726623535156, 63.71625518798828, 65.22679138183594, 66.73731994628906, 68.24784851074219, 69.75838470458984, 71.26891326904297, 72.77944946289062, 74.28997802734375, 75.8005142211914, 77.31104278564453, 78.82157897949219, 80.33210754394531, 81.84263610839844]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 10.0, 4.0, 5.0, 11.0, 14.0, 8.0, 19.0, 15.0, 20.0, 27.0, 27.0, 26.0, 23.0, 49.0, 39.0, 50.0, 43.0, 52.0, 37.0, 45.0, 49.0, 47.0, 36.0, 38.0, 32.0, 31.0, 29.0, 33.0, 30.0, 23.0, 27.0, 19.0, 22.0, 7.0, 10.0, 8.0, 6.0, 13.0, 7.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.446765899658203, -16.941373825073242, -16.43597984313965, -15.930586814880371, -15.425193786621094, -14.919801712036133, -14.414408683776855, -13.909015655517578, -13.4036226272583, -12.898229598999023, -12.392836570739746, -11.887443542480469, -11.382051467895508, -10.876657485961914, -10.371265411376953, -9.865872383117676, -9.360479354858398, -8.855086326599121, -8.349693298339844, -7.844300746917725, -7.338907718658447, -6.83351469039917, -6.328122138977051, -5.822729110717773, -5.317336082458496, -4.811943054199219, -4.306550025939941, -3.8011574745178223, -3.295764446258545, -2.7903714179992676, -2.2849786281585693, -1.779585838317871, -1.2741947174072266, -0.7688018083572388, -0.263408899307251, 0.24198400974273682, 0.7473769187927246, 1.252769947052002, 1.7581627368927002, 2.2635555267333984, 2.768948554992676, 3.274341583251953, 3.7797343730926514, 4.28512716293335, 4.790520191192627, 5.295913219451904, 5.801305770874023, 6.306698799133301, 6.812091827392578, 7.3174848556518555, 7.822877883911133, 8.32827091217041, 8.833663940429688, 9.339056015014648, 9.844449043273926, 10.349842071533203, 10.85523509979248, 11.360628128051758, 11.866021156311035, 12.371414184570312, 12.876806259155273, 13.382200241088867, 13.887592315673828, 14.392985343933105, 14.898378372192383]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 8.0, 5.0, 8.0, 15.0, 19.0, 21.0, 22.0, 33.0, 20.0, 27.0, 33.0, 26.0, 45.0, 44.0, 44.0, 38.0, 32.0, 44.0, 39.0, 38.0, 38.0, 40.0, 43.0, 31.0, 31.0, 38.0, 25.0, 23.0, 25.0, 8.0, 12.0, 16.0, 13.0, 13.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.6841278076171875, -1.626068115234375, -1.5680084228515625, -1.50994873046875, -1.4518890380859375, -1.393829345703125, -1.3357696533203125, -1.2777099609375, -1.2196502685546875, -1.161590576171875, -1.1035308837890625, -1.04547119140625, -0.9874114990234375, -0.929351806640625, -0.8712921142578125, -0.813232421875, -0.7551727294921875, -0.697113037109375, -0.6390533447265625, -0.58099365234375, -0.5229339599609375, -0.464874267578125, -0.4068145751953125, -0.3487548828125, -0.2906951904296875, -0.232635498046875, -0.1745758056640625, -0.11651611328125, -0.0584564208984375, -0.000396728515625, 0.0576629638671875, 0.11572265625, 0.1737823486328125, 0.231842041015625, 0.2899017333984375, 0.34796142578125, 0.4060211181640625, 0.464080810546875, 0.5221405029296875, 0.5802001953125, 0.6382598876953125, 0.696319580078125, 0.7543792724609375, 0.81243896484375, 0.8704986572265625, 0.928558349609375, 0.9866180419921875, 1.044677734375, 1.1027374267578125, 1.160797119140625, 1.2188568115234375, 1.27691650390625, 1.3349761962890625, 1.393035888671875, 1.4510955810546875, 1.5091552734375, 1.5672149658203125, 1.625274658203125, 1.6833343505859375, 1.74139404296875, 1.7994537353515625, 1.857513427734375, 1.9155731201171875, 1.9736328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 7.0, 4.0, 8.0, 14.0, 24.0, 29.0, 43.0, 66.0, 99.0, 149.0, 187.0, 312.0, 417.0, 672.0, 968.0, 1361.0, 2032.0, 2893.0, 4263.0, 6013.0, 9129.0, 13329.0, 20393.0, 31397.0, 51219.0, 87215.0, 165808.0, 283212.0, 150000.0, 80975.0, 47764.0, 29522.0, 19304.0, 12575.0, 8542.0, 5955.0, 3961.0, 2736.0, 1875.0, 1274.0, 880.0, 601.0, 449.0, 273.0, 213.0, 137.0, 96.0, 60.0, 39.0, 28.0, 14.0, 10.0, 13.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.31319427490234375, -0.3029022216796875, -0.29261016845703125, -0.282318115234375, -0.27202606201171875, -0.2617340087890625, -0.25144195556640625, -0.24114990234375, -0.23085784912109375, -0.2205657958984375, -0.21027374267578125, -0.199981689453125, -0.18968963623046875, -0.1793975830078125, -0.16910552978515625, -0.1588134765625, -0.14852142333984375, -0.1382293701171875, -0.12793731689453125, -0.117645263671875, -0.10735321044921875, -0.0970611572265625, -0.08676910400390625, -0.07647705078125, -0.06618499755859375, -0.0558929443359375, -0.04560089111328125, -0.035308837890625, -0.02501678466796875, -0.0147247314453125, -0.00443267822265625, 0.005859375, 0.01615142822265625, 0.0264434814453125, 0.03673553466796875, 0.047027587890625, 0.05731964111328125, 0.0676116943359375, 0.07790374755859375, 0.08819580078125, 0.09848785400390625, 0.1087799072265625, 0.11907196044921875, 0.129364013671875, 0.13965606689453125, 0.1499481201171875, 0.16024017333984375, 0.1705322265625, 0.18082427978515625, 0.1911163330078125, 0.20140838623046875, 0.211700439453125, 0.22199249267578125, 0.2322845458984375, 0.24257659912109375, 0.25286865234375, 0.26316070556640625, 0.2734527587890625, 0.28374481201171875, 0.294036865234375, 0.30432891845703125, 0.3146209716796875, 0.32491302490234375, 0.335205078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 5.0, 4.0, 4.0, 8.0, 2.0, 9.0, 10.0, 10.0, 14.0, 18.0, 27.0, 15.0, 21.0, 25.0, 32.0, 34.0, 38.0, 35.0, 29.0, 34.0, 39.0, 31.0, 1072.0, 51.0, 49.0, 36.0, 44.0, 41.0, 37.0, 34.0, 20.0, 30.0, 26.0, 22.0, 22.0, 12.0, 13.0, 16.0, 9.0, 12.0, 9.0, 7.0, 4.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2392578125, -1.2024078369140625, -1.165557861328125, -1.1287078857421875, -1.09185791015625, -1.0550079345703125, -1.018157958984375, -0.9813079833984375, -0.9444580078125, -0.9076080322265625, -0.870758056640625, -0.8339080810546875, -0.79705810546875, -0.7602081298828125, -0.723358154296875, -0.6865081787109375, -0.649658203125, -0.6128082275390625, -0.575958251953125, -0.5391082763671875, -0.50225830078125, -0.4654083251953125, -0.428558349609375, -0.3917083740234375, -0.3548583984375, -0.3180084228515625, -0.281158447265625, -0.2443084716796875, -0.20745849609375, -0.1706085205078125, -0.133758544921875, -0.0969085693359375, -0.06005859375, -0.0232086181640625, 0.013641357421875, 0.0504913330078125, 0.08734130859375, 0.1241912841796875, 0.161041259765625, 0.1978912353515625, 0.2347412109375, 0.2715911865234375, 0.308441162109375, 0.3452911376953125, 0.38214111328125, 0.4189910888671875, 0.455841064453125, 0.4926910400390625, 0.529541015625, 0.5663909912109375, 0.603240966796875, 0.6400909423828125, 0.67694091796875, 0.7137908935546875, 0.750640869140625, 0.7874908447265625, 0.8243408203125, 0.8611907958984375, 0.898040771484375, 0.9348907470703125, 0.97174072265625, 1.0085906982421875, 1.045440673828125, 1.0822906494140625, 1.119140625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 4.0, 16.0, 13.0, 26.0, 37.0, 50.0, 76.0, 99.0, 144.0, 244.0, 358.0, 489.0, 737.0, 1093.0, 1660.0, 2400.0, 3477.0, 5183.0, 7527.0, 11576.0, 17713.0, 28041.0, 45921.0, 80403.0, 155560.0, 1348125.0, 168058.0, 84978.0, 48978.0, 29454.0, 18487.0, 11909.0, 7697.0, 5224.0, 3497.0, 2412.0, 1745.0, 1183.0, 800.0, 545.0, 401.0, 258.0, 191.0, 118.0, 78.0, 47.0, 37.0, 27.0, 14.0, 9.0, 6.0, 0.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.33544921875, -0.3254508972167969, -0.31545257568359375, -0.3054542541503906, -0.2954559326171875, -0.2854576110839844, -0.27545928955078125, -0.2654609680175781, -0.255462646484375, -0.24546432495117188, -0.23546600341796875, -0.22546768188476562, -0.2154693603515625, -0.20547103881835938, -0.19547271728515625, -0.18547439575195312, -0.17547607421875, -0.16547775268554688, -0.15547943115234375, -0.14548110961914062, -0.1354827880859375, -0.12548446655273438, -0.11548614501953125, -0.10548782348632812, -0.095489501953125, -0.08549118041992188, -0.07549285888671875, -0.06549453735351562, -0.0554962158203125, -0.045497894287109375, -0.03549957275390625, -0.025501251220703125, -0.0155029296875, -0.005504608154296875, 0.00449371337890625, 0.014492034912109375, 0.0244903564453125, 0.034488677978515625, 0.04448699951171875, 0.054485321044921875, 0.064483642578125, 0.07448196411132812, 0.08448028564453125, 0.09447860717773438, 0.1044769287109375, 0.11447525024414062, 0.12447357177734375, 0.13447189331054688, 0.14447021484375, 0.15446853637695312, 0.16446685791015625, 0.17446517944335938, 0.1844635009765625, 0.19446182250976562, 0.20446014404296875, 0.21445846557617188, 0.224456787109375, 0.23445510864257812, 0.24445343017578125, 0.2544517517089844, 0.2644500732421875, 0.2744483947753906, 0.28444671630859375, 0.2944450378417969, 0.304443359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 9.0, 12.0, 22.0, 18.0, 17.0, 30.0, 46.0, 44.0, 62.0, 56.0, 57.0, 45.0, 59.0, 75.0, 57.0, 45.0, 44.0, 38.0, 44.0, 44.0, 34.0, 32.0, 23.0, 17.0, 4.0, 10.0, 5.0, 6.0, 2.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00025653839111328125, -0.00024934113025665283, -0.00024214386940002441, -0.000234946608543396, -0.00022774934768676758, -0.00022055208683013916, -0.00021335482597351074, -0.00020615756511688232, -0.0001989603042602539, -0.0001917630434036255, -0.00018456578254699707, -0.00017736852169036865, -0.00017017126083374023, -0.00016297399997711182, -0.0001557767391204834, -0.00014857947826385498, -0.00014138221740722656, -0.00013418495655059814, -0.00012698769569396973, -0.00011979043483734131, -0.00011259317398071289, -0.00010539591312408447, -9.819865226745605e-05, -9.100139141082764e-05, -8.380413055419922e-05, -7.66068696975708e-05, -6.940960884094238e-05, -6.221234798431396e-05, -5.501508712768555e-05, -4.781782627105713e-05, -4.062056541442871e-05, -3.342330455780029e-05, -2.6226043701171875e-05, -1.9028782844543457e-05, -1.1831521987915039e-05, -4.634261131286621e-06, 2.562999725341797e-06, 9.760260581970215e-06, 1.6957521438598633e-05, 2.415478229522705e-05, 3.135204315185547e-05, 3.854930400848389e-05, 4.5746564865112305e-05, 5.294382572174072e-05, 6.014108657836914e-05, 6.733834743499756e-05, 7.453560829162598e-05, 8.17328691482544e-05, 8.893013000488281e-05, 9.612739086151123e-05, 0.00010332465171813965, 0.00011052191257476807, 0.00011771917343139648, 0.0001249164342880249, 0.00013211369514465332, 0.00013931095600128174, 0.00014650821685791016, 0.00015370547771453857, 0.000160902738571167, 0.0001680999994277954, 0.00017529726028442383, 0.00018249452114105225, 0.00018969178199768066, 0.00019688904285430908, 0.0002040863037109375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 7.0, 14.0, 18.0, 19.0, 36.0, 56.0, 56.0, 76.0, 97.0, 162.0, 245.0, 448.0, 727.0, 5406.0, 984683.0, 54058.0, 986.0, 477.0, 336.0, 191.0, 108.0, 93.0, 63.0, 41.0, 30.0, 17.0, 17.0, 15.0, 14.0, 8.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0036182403564453125, -0.003487497568130493, -0.003356754779815674, -0.0032260119915008545, -0.003095269203186035, -0.002964526414871216, -0.0028337836265563965, -0.002703040838241577, -0.002572298049926758, -0.0024415552616119385, -0.002310812473297119, -0.0021800696849823, -0.0020493268966674805, -0.0019185841083526611, -0.0017878413200378418, -0.0016570985317230225, -0.0015263557434082031, -0.0013956129550933838, -0.0012648701667785645, -0.0011341273784637451, -0.0010033845901489258, -0.0008726418018341064, -0.0007418990135192871, -0.0006111562252044678, -0.00048041343688964844, -0.0003496706485748291, -0.00021892786026000977, -8.818507194519043e-05, 4.2557716369628906e-05, 0.00017330050468444824, 0.0003040432929992676, 0.0004347860813140869, 0.0005655288696289062, 0.0006962716579437256, 0.0008270144462585449, 0.0009577572345733643, 0.0010885000228881836, 0.001219242811203003, 0.0013499855995178223, 0.0014807283878326416, 0.001611471176147461, 0.0017422139644622803, 0.0018729567527770996, 0.002003699541091919, 0.0021344423294067383, 0.0022651851177215576, 0.002395927906036377, 0.0025266706943511963, 0.0026574134826660156, 0.002788156270980835, 0.0029188990592956543, 0.0030496418476104736, 0.003180384635925293, 0.0033111274242401123, 0.0034418702125549316, 0.003572613000869751, 0.0037033557891845703, 0.0038340985774993896, 0.003964841365814209, 0.004095584154129028, 0.004226326942443848, 0.004357069730758667, 0.004487812519073486, 0.004618555307388306, 0.004749298095703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 16.0, 60.0, 96.0, 145.0, 174.0, 171.0, 154.0, 101.0, 49.0, 18.0, 10.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023732439149171114, -0.00022992145386524498, -0.00022251851623877883, -0.00021511557861231267, -0.00020771264098584652, -0.00020030970335938036, -0.0001929067657329142, -0.00018550382810644805, -0.0001781008904799819, -0.00017069795285351574, -0.0001632950152270496, -0.00015589207760058343, -0.00014848913997411728, -0.00014108620234765112, -0.00013368326472118497, -0.00012628032709471881, -0.00011887740402016789, -0.00011147446639370173, -0.00010407152876723558, -9.666859114076942e-05, -8.926565351430327e-05, -8.186271588783711e-05, -7.445978553732857e-05, -6.705684791086242e-05, -5.965391028439626e-05, -5.2250972657930106e-05, -4.484803503146395e-05, -3.74451010429766e-05, -3.0042163416510448e-05, -2.2639225790044293e-05, -1.5236291801556945e-05, -7.83335417509079e-06, -4.304311005398631e-07, 6.97250561643159e-06, 1.4375442333403043e-05, 2.1778378140879795e-05, 2.918131576734595e-05, 3.6584253393812105e-05, 4.398718738229945e-05, 5.139012500876561e-05, 5.879306263523176e-05, 6.619600026169792e-05, 7.359893788816407e-05, 8.100186823867261e-05, 8.840480586513877e-05, 9.580774349160492e-05, 0.00010321068111807108, 0.00011061361874453723, 0.00011801655637100339, 0.00012541949399746954, 0.0001328224316239357, 0.00014022536925040185, 0.000147628306876868, 0.00015503124450333416, 0.00016243418212980032, 0.00016983711975626647, 0.00017724005738273263, 0.00018464299500919878, 0.00019204593263566494, 0.0001994488702621311, 0.00020685180788859725, 0.0002142547455150634, 0.00022165768314152956, 0.00022906062076799572, 0.00023646354384254664]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 7.0, 15.0, 14.0, 18.0, 17.0, 25.0, 23.0, 18.0, 15.0, 24.0, 32.0, 28.0, 32.0, 44.0, 39.0, 42.0, 40.0, 40.0, 40.0, 42.0, 41.0, 35.0, 34.0, 38.0, 38.0, 21.0, 26.0, 27.0, 22.0, 24.0, 15.0, 14.0, 24.0, 12.0, 9.0, 12.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00011795759201049805, -0.0001145070418715477, -0.00011105649173259735, -0.000107605941593647, -0.00010415539145469666, -0.00010070484131574631, -9.725429117679596e-05, -9.380374103784561e-05, -9.035319089889526e-05, -8.690264075994492e-05, -8.345209062099457e-05, -8.000154048204422e-05, -7.655099034309387e-05, -7.310044020414352e-05, -6.964989006519318e-05, -6.619933992624283e-05, -6.274878978729248e-05, -5.929823964834213e-05, -5.5847689509391785e-05, -5.239713937044144e-05, -4.894658923149109e-05, -4.549603909254074e-05, -4.204548895359039e-05, -3.8594938814640045e-05, -3.51443886756897e-05, -3.169383853673935e-05, -2.8243288397789e-05, -2.4792738258838654e-05, -2.1342188119888306e-05, -1.7891637980937958e-05, -1.444108784198761e-05, -1.0990537703037262e-05, -7.539987564086914e-06, -4.089437425136566e-06, -6.388872861862183e-07, 2.8116628527641296e-06, 6.2622129917144775e-06, 9.712763130664825e-06, 1.3163313269615173e-05, 1.661386340856552e-05, 2.006441354751587e-05, 2.3514963686466217e-05, 2.6965513825416565e-05, 3.0416063964366913e-05, 3.386661410331726e-05, 3.731716424226761e-05, 4.0767714381217957e-05, 4.4218264520168304e-05, 4.766881465911865e-05, 5.1119364798069e-05, 5.456991493701935e-05, 5.8020465075969696e-05, 6.147101521492004e-05, 6.492156535387039e-05, 6.837211549282074e-05, 7.182266563177109e-05, 7.527321577072144e-05, 7.872376590967178e-05, 8.217431604862213e-05, 8.562486618757248e-05, 8.907541632652283e-05, 9.252596646547318e-05, 9.597651660442352e-05, 9.942706674337387e-05, 0.00010287761688232422]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 8.0, 5.0, 8.0, 15.0, 19.0, 21.0, 22.0, 33.0, 20.0, 27.0, 33.0, 26.0, 45.0, 44.0, 44.0, 38.0, 32.0, 44.0, 39.0, 38.0, 38.0, 40.0, 43.0, 31.0, 31.0, 38.0, 25.0, 23.0, 25.0, 8.0, 12.0, 16.0, 13.0, 13.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.6841278076171875, -1.626068115234375, -1.5680084228515625, -1.50994873046875, -1.4518890380859375, -1.393829345703125, -1.3357696533203125, -1.2777099609375, -1.2196502685546875, -1.161590576171875, -1.1035308837890625, -1.04547119140625, -0.9874114990234375, -0.929351806640625, -0.8712921142578125, -0.813232421875, -0.7551727294921875, -0.697113037109375, -0.6390533447265625, -0.58099365234375, -0.5229339599609375, -0.464874267578125, -0.4068145751953125, -0.3487548828125, -0.2906951904296875, -0.232635498046875, -0.1745758056640625, -0.11651611328125, -0.0584564208984375, -0.000396728515625, 0.0576629638671875, 0.11572265625, 0.1737823486328125, 0.231842041015625, 0.2899017333984375, 0.34796142578125, 0.4060211181640625, 0.464080810546875, 0.5221405029296875, 0.5802001953125, 0.6382598876953125, 0.696319580078125, 0.7543792724609375, 0.81243896484375, 0.8704986572265625, 0.928558349609375, 0.9866180419921875, 1.044677734375, 1.1027374267578125, 1.160797119140625, 1.2188568115234375, 1.27691650390625, 1.3349761962890625, 1.393035888671875, 1.4510955810546875, 1.5091552734375, 1.5672149658203125, 1.625274658203125, 1.6833343505859375, 1.74139404296875, 1.7994537353515625, 1.857513427734375, 1.9155731201171875, 1.9736328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 8.0, 4.0, 7.0, 4.0, 16.0, 13.0, 16.0, 21.0, 41.0, 59.0, 89.0, 108.0, 191.0, 292.0, 566.0, 854.0, 1601.0, 2894.0, 5706.0, 11125.0, 24271.0, 59467.0, 170982.0, 382467.0, 242565.0, 83470.0, 31876.0, 14371.0, 7031.0, 3684.0, 2058.0, 1082.0, 629.0, 342.0, 195.0, 119.0, 90.0, 80.0, 45.0, 33.0, 21.0, 20.0, 9.0, 12.0, 4.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-2.2265625, -2.15625, -2.0859375, -2.015625, -1.9453125, -1.875, -1.8046875, -1.734375, -1.6640625, -1.59375, -1.5234375, -1.453125, -1.3828125, -1.3125, -1.2421875, -1.171875, -1.1015625, -1.03125, -0.9609375, -0.890625, -0.8203125, -0.75, -0.6796875, -0.609375, -0.5390625, -0.46875, -0.3984375, -0.328125, -0.2578125, -0.1875, -0.1171875, -0.046875, 0.0234375, 0.09375, 0.1640625, 0.234375, 0.3046875, 0.375, 0.4453125, 0.515625, 0.5859375, 0.65625, 0.7265625, 0.796875, 0.8671875, 0.9375, 1.0078125, 1.078125, 1.1484375, 1.21875, 1.2890625, 1.359375, 1.4296875, 1.5, 1.5703125, 1.640625, 1.7109375, 1.78125, 1.8515625, 1.921875, 1.9921875, 2.0625, 2.1328125, 2.203125, 2.2734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 9.0, 10.0, 14.0, 17.0, 16.0, 25.0, 20.0, 35.0, 38.0, 34.0, 40.0, 62.0, 58.0, 68.0, 147.0, 324.0, 1398.0, 180.0, 88.0, 72.0, 55.0, 49.0, 29.0, 42.0, 31.0, 23.0, 31.0, 20.0, 18.0, 14.0, 13.0, 5.0, 8.0, 6.0, 5.0, 5.0, 6.0, 0.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44140625, -7.2021484375, -6.962890625, -6.7236328125, -6.484375, -6.2451171875, -6.005859375, -5.7666015625, -5.52734375, -5.2880859375, -5.048828125, -4.8095703125, -4.5703125, -4.3310546875, -4.091796875, -3.8525390625, -3.61328125, -3.3740234375, -3.134765625, -2.8955078125, -2.65625, -2.4169921875, -2.177734375, -1.9384765625, -1.69921875, -1.4599609375, -1.220703125, -0.9814453125, -0.7421875, -0.5029296875, -0.263671875, -0.0244140625, 0.21484375, 0.4541015625, 0.693359375, 0.9326171875, 1.171875, 1.4111328125, 1.650390625, 1.8896484375, 2.12890625, 2.3681640625, 2.607421875, 2.8466796875, 3.0859375, 3.3251953125, 3.564453125, 3.8037109375, 4.04296875, 4.2822265625, 4.521484375, 4.7607421875, 5.0, 5.2392578125, 5.478515625, 5.7177734375, 5.95703125, 6.1962890625, 6.435546875, 6.6748046875, 6.9140625, 7.1533203125, 7.392578125, 7.6318359375, 7.87109375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 2.0, 7.0, 17.0, 31.0, 39.0, 60.0, 108.0, 201.0, 422.0, 1783.0, 2646260.0, 494612.0, 1340.0, 364.0, 170.0, 105.0, 58.0, 37.0, 30.0, 12.0, 17.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-47.90625, -46.736083984375, -45.56591796875, -44.395751953125, -43.2255859375, -42.055419921875, -40.88525390625, -39.715087890625, -38.544921875, -37.374755859375, -36.20458984375, -35.034423828125, -33.8642578125, -32.694091796875, -31.52392578125, -30.353759765625, -29.18359375, -28.013427734375, -26.84326171875, -25.673095703125, -24.5029296875, -23.332763671875, -22.16259765625, -20.992431640625, -19.822265625, -18.652099609375, -17.48193359375, -16.311767578125, -15.1416015625, -13.971435546875, -12.80126953125, -11.631103515625, -10.4609375, -9.290771484375, -8.12060546875, -6.950439453125, -5.7802734375, -4.610107421875, -3.43994140625, -2.269775390625, -1.099609375, 0.070556640625, 1.24072265625, 2.410888671875, 3.5810546875, 4.751220703125, 5.92138671875, 7.091552734375, 8.26171875, 9.431884765625, 10.60205078125, 11.772216796875, 12.9423828125, 14.112548828125, 15.28271484375, 16.452880859375, 17.623046875, 18.793212890625, 19.96337890625, 21.133544921875, 22.3037109375, 23.473876953125, 24.64404296875, 25.814208984375, 26.984375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [796.0, 218.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.200349807739258, 0.8117284774780273, 5.8238067626953125, 10.835885047912598, 15.847963333129883, 20.86004066467285, 25.872119903564453, 30.884199142456055, 35.896278381347656, 40.908355712890625, 45.920433044433594, 50.93251419067383, 55.9445915222168, 60.956668853759766, 65.96875, 70.98082733154297, 75.99290466308594, 81.0049819946289, 86.01705932617188, 91.02913665771484, 96.04121398925781, 101.05329895019531, 106.06537628173828, 111.07745361328125, 116.08953094482422, 121.10160827636719, 126.11368560791016, 131.12576293945312, 136.13784790039062, 141.14991760253906, 146.16200256347656, 151.174072265625, 156.1861572265625, 161.1982421875, 166.21031188964844, 171.22239685058594, 176.23446655273438, 181.24655151367188, 186.2586212158203, 191.2707061767578, 196.28277587890625, 201.29486083984375, 206.3069305419922, 211.3190155029297, 216.33108520507812, 221.34317016601562, 226.35523986816406, 231.36732482910156, 236.37940979003906, 241.39149475097656, 246.403564453125, 251.4156494140625, 256.427734375, 261.4397888183594, 266.4518737792969, 271.4639587402344, 276.4760437011719, 281.4881286621094, 286.5002136230469, 291.51226806640625, 296.52435302734375, 301.53643798828125, 306.54852294921875, 311.56060791015625, 316.5726623535156]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 2.0, 4.0, 13.0, 11.0, 13.0, 18.0, 11.0, 15.0, 22.0, 25.0, 28.0, 22.0, 36.0, 37.0, 30.0, 39.0, 29.0, 39.0, 41.0, 39.0, 37.0, 35.0, 36.0, 33.0, 43.0, 38.0, 30.0, 34.0, 31.0, 24.0, 22.0, 24.0, 18.0, 17.0, 14.0, 12.0, 14.0, 12.0, 2.0, 11.0, 9.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.929765701293945, -18.370332717895508, -17.81089973449707, -17.25146484375, -16.692031860351562, -16.132598876953125, -15.573165893554688, -15.01373291015625, -14.454298973083496, -13.894865989685059, -13.335432052612305, -12.775999069213867, -12.21656608581543, -11.657132148742676, -11.097699165344238, -10.538265228271484, -9.978832244873047, -9.41939926147461, -8.859965324401855, -8.300532341003418, -7.741098880767822, -7.181665420532227, -6.622232437133789, -6.062798976898193, -5.503365516662598, -4.943932056427002, -4.384498596191406, -3.8250656127929688, -3.265632152557373, -2.7061986923217773, -2.1467654705047607, -1.5873322486877441, -1.0278987884521484, -0.4684654474258423, 0.09096789360046387, 0.65040123462677, 1.2098345756530762, 1.7692680358886719, 2.3287012577056885, 2.888134479522705, 3.447567939758301, 4.0070013999938965, 4.566434860229492, 5.12586784362793, 5.685301303863525, 6.244734764099121, 6.804167747497559, 7.363601207733154, 7.92303466796875, 8.482467651367188, 9.041901588439941, 9.601334571838379, 10.160768508911133, 10.72020149230957, 11.279634475708008, 11.839067459106445, 12.3985013961792, 12.957934379577637, 13.51736831665039, 14.076801300048828, 14.636234283447266, 15.19566822052002, 15.755101203918457, 16.31453514099121, 16.87396812438965]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 13.0, 11.0, 13.0, 14.0, 20.0, 12.0, 31.0, 16.0, 26.0, 24.0, 29.0, 28.0, 34.0, 45.0, 35.0, 38.0, 30.0, 37.0, 39.0, 46.0, 32.0, 36.0, 48.0, 38.0, 34.0, 32.0, 27.0, 34.0, 18.0, 20.0, 19.0, 18.0, 8.0, 12.0, 13.0, 9.0, 4.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8095703125, -1.7487945556640625, -1.688018798828125, -1.6272430419921875, -1.56646728515625, -1.5056915283203125, -1.444915771484375, -1.3841400146484375, -1.3233642578125, -1.2625885009765625, -1.201812744140625, -1.1410369873046875, -1.08026123046875, -1.0194854736328125, -0.958709716796875, -0.8979339599609375, -0.837158203125, -0.7763824462890625, -0.715606689453125, -0.6548309326171875, -0.59405517578125, -0.5332794189453125, -0.472503662109375, -0.4117279052734375, -0.3509521484375, -0.2901763916015625, -0.229400634765625, -0.1686248779296875, -0.10784912109375, -0.0470733642578125, 0.013702392578125, 0.0744781494140625, 0.13525390625, 0.1960296630859375, 0.256805419921875, 0.3175811767578125, 0.37835693359375, 0.4391326904296875, 0.499908447265625, 0.5606842041015625, 0.6214599609375, 0.6822357177734375, 0.743011474609375, 0.8037872314453125, 0.86456298828125, 0.9253387451171875, 0.986114501953125, 1.0468902587890625, 1.107666015625, 1.1684417724609375, 1.229217529296875, 1.2899932861328125, 1.35076904296875, 1.4115447998046875, 1.472320556640625, 1.5330963134765625, 1.5938720703125, 1.6546478271484375, 1.715423583984375, 1.7761993408203125, 1.83697509765625, 1.8977508544921875, 1.958526611328125, 2.0193023681640625, 2.080078125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 0.0, 4.0, 15.0, 13.0, 13.0, 9.0, 17.0, 15.0, 18.0, 27.0, 40.0, 36.0, 47.0, 63.0, 84.0, 77.0, 112.0, 202.0, 393.0, 1331.0, 15589.0, 944079.0, 3130760.0, 96166.0, 3589.0, 620.0, 260.0, 145.0, 106.0, 96.0, 59.0, 54.0, 43.0, 30.0, 29.0, 16.0, 19.0, 23.0, 21.0, 13.0, 9.0, 10.0, 5.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.29443359375, -8.0107421875, -7.72705078125, -7.443359375, -7.15966796875, -6.8759765625, -6.59228515625, -6.30859375, -6.02490234375, -5.7412109375, -5.45751953125, -5.173828125, -4.89013671875, -4.6064453125, -4.32275390625, -4.0390625, -3.75537109375, -3.4716796875, -3.18798828125, -2.904296875, -2.62060546875, -2.3369140625, -2.05322265625, -1.76953125, -1.48583984375, -1.2021484375, -0.91845703125, -0.634765625, -0.35107421875, -0.0673828125, 0.21630859375, 0.5, 0.78369140625, 1.0673828125, 1.35107421875, 1.634765625, 1.91845703125, 2.2021484375, 2.48583984375, 2.76953125, 3.05322265625, 3.3369140625, 3.62060546875, 3.904296875, 4.18798828125, 4.4716796875, 4.75537109375, 5.0390625, 5.32275390625, 5.6064453125, 5.89013671875, 6.173828125, 6.45751953125, 6.7412109375, 7.02490234375, 7.30859375, 7.59228515625, 7.8759765625, 8.15966796875, 8.443359375, 8.72705078125, 9.0107421875, 9.29443359375, 9.578125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 9.0, 19.0, 26.0, 28.0, 45.0, 56.0, 88.0, 122.0, 178.0, 239.0, 341.0, 414.0, 480.0, 468.0, 407.0, 320.0, 231.0, 172.0, 137.0, 84.0, 61.0, 39.0, 35.0, 15.0, 15.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.84375, -5.67138671875, -5.4990234375, -5.32666015625, -5.154296875, -4.98193359375, -4.8095703125, -4.63720703125, -4.46484375, -4.29248046875, -4.1201171875, -3.94775390625, -3.775390625, -3.60302734375, -3.4306640625, -3.25830078125, -3.0859375, -2.91357421875, -2.7412109375, -2.56884765625, -2.396484375, -2.22412109375, -2.0517578125, -1.87939453125, -1.70703125, -1.53466796875, -1.3623046875, -1.18994140625, -1.017578125, -0.84521484375, -0.6728515625, -0.50048828125, -0.328125, -0.15576171875, 0.0166015625, 0.18896484375, 0.361328125, 0.53369140625, 0.7060546875, 0.87841796875, 1.05078125, 1.22314453125, 1.3955078125, 1.56787109375, 1.740234375, 1.91259765625, 2.0849609375, 2.25732421875, 2.4296875, 2.60205078125, 2.7744140625, 2.94677734375, 3.119140625, 3.29150390625, 3.4638671875, 3.63623046875, 3.80859375, 3.98095703125, 4.1533203125, 4.32568359375, 4.498046875, 4.67041015625, 4.8427734375, 5.01513671875, 5.1875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 17.0, 12.0, 23.0, 34.0, 56.0, 76.0, 96.0, 115.0, 206.0, 277.0, 506.0, 1288.0, 9381.0, 457966.0, 3587997.0, 129679.0, 4420.0, 909.0, 412.0, 247.0, 154.0, 97.0, 83.0, 63.0, 53.0, 32.0, 23.0, 12.0, 10.0, 15.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.78125, -13.3272705078125, -12.873291015625, -12.4193115234375, -11.96533203125, -11.5113525390625, -11.057373046875, -10.6033935546875, -10.1494140625, -9.6954345703125, -9.241455078125, -8.7874755859375, -8.33349609375, -7.8795166015625, -7.425537109375, -6.9715576171875, -6.517578125, -6.0635986328125, -5.609619140625, -5.1556396484375, -4.70166015625, -4.2476806640625, -3.793701171875, -3.3397216796875, -2.8857421875, -2.4317626953125, -1.977783203125, -1.5238037109375, -1.06982421875, -0.6158447265625, -0.161865234375, 0.2921142578125, 0.74609375, 1.2000732421875, 1.654052734375, 2.1080322265625, 2.56201171875, 3.0159912109375, 3.469970703125, 3.9239501953125, 4.3779296875, 4.8319091796875, 5.285888671875, 5.7398681640625, 6.19384765625, 6.6478271484375, 7.101806640625, 7.5557861328125, 8.009765625, 8.4637451171875, 8.917724609375, 9.3717041015625, 9.82568359375, 10.2796630859375, 10.733642578125, 11.1876220703125, 11.6416015625, 12.0955810546875, 12.549560546875, 13.0035400390625, 13.45751953125, 13.9114990234375, 14.365478515625, 14.8194580078125, 15.2734375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 74.0, 564.0, 351.0, 24.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.5766143798828, -202.94308471679688, -198.30955505371094, -193.676025390625, -189.04251098632812, -184.4089813232422, -179.77545166015625, -175.1419219970703, -170.50839233398438, -165.87486267089844, -161.2413330078125, -156.60780334472656, -151.97427368164062, -147.34075927734375, -142.7072296142578, -138.07369995117188, -133.44017028808594, -128.806640625, -124.17311096191406, -119.53958892822266, -114.90605926513672, -110.27252960205078, -105.63900756835938, -101.00547790527344, -96.3719482421875, -91.73841857910156, -87.10488891601562, -82.47136688232422, -77.83783721923828, -73.20430755615234, -68.57078552246094, -63.937255859375, -59.30372619628906, -54.670196533203125, -50.03667068481445, -45.40314483642578, -40.769615173339844, -36.136085510253906, -31.502559661865234, -26.869033813476562, -22.235504150390625, -17.60197639465332, -12.968448638916016, -8.334920883178711, -3.7013931274414062, 0.9321346282958984, 5.565662384033203, 10.199188232421875, 14.832717895507812, 19.466245651245117, 24.099773406982422, 28.733301162719727, 33.36682891845703, 38.00035858154297, 42.63388442993164, 47.26741027832031, 51.90093994140625, 56.53446960449219, 61.16799545288086, 65.80152130126953, 70.43505096435547, 75.0685806274414, 79.70210266113281, 84.33563232421875, 88.96916198730469]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 12.0, 5.0, 8.0, 13.0, 17.0, 17.0, 11.0, 15.0, 16.0, 23.0, 28.0, 20.0, 26.0, 24.0, 38.0, 32.0, 40.0, 41.0, 45.0, 46.0, 43.0, 37.0, 38.0, 38.0, 38.0, 38.0, 42.0, 26.0, 27.0, 25.0, 22.0, 18.0, 27.0, 15.0, 11.0, 17.0, 12.0, 8.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.296612739562988, -13.795836448669434, -13.295059204101562, -12.794282913208008, -12.293505668640137, -11.792729377746582, -11.291952133178711, -10.791175842285156, -10.290399551391602, -9.789623260498047, -9.288846015930176, -8.788069725036621, -8.28729248046875, -7.786516189575195, -7.285739421844482, -6.7849626541137695, -6.284185409545898, -5.7834086418151855, -5.282631874084473, -4.781855583190918, -4.281078338623047, -3.780301809310913, -3.2795252799987793, -2.7787485122680664, -2.2779717445373535, -1.7771949768066406, -1.2764183282852173, -0.775641679763794, -0.27486491203308105, 0.22591185569763184, 0.7266883850097656, 1.2274651527404785, 1.7282428741455078, 2.2290196418762207, 2.7297964096069336, 3.2305729389190674, 3.7313497066497803, 4.232126235961914, 4.732903003692627, 5.23367977142334, 5.734456539154053, 6.235233306884766, 6.7360100746154785, 7.236786842346191, 7.737563133239746, 8.238340377807617, 8.739116668701172, 9.239892959594727, 9.740670204162598, 10.241446495056152, 10.742223739624023, 11.243000030517578, 11.74377727508545, 12.244553565979004, 12.745330810546875, 13.24610710144043, 13.746883392333984, 14.247659683227539, 14.74843692779541, 15.249213218688965, 15.749990463256836, 16.25076675415039, 16.751543045043945, 17.2523193359375, 17.753097534179688]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 11.0, 10.0, 6.0, 5.0, 16.0, 13.0, 16.0, 17.0, 19.0, 24.0, 20.0, 24.0, 34.0, 32.0, 37.0, 44.0, 30.0, 29.0, 40.0, 53.0, 49.0, 33.0, 31.0, 62.0, 40.0, 31.0, 32.0, 34.0, 34.0, 19.0, 24.0, 21.0, 19.0, 16.0, 13.0, 11.0, 7.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.821563720703125, -1.75640869140625, -1.691253662109375, -1.6260986328125, -1.560943603515625, -1.49578857421875, -1.430633544921875, -1.365478515625, -1.300323486328125, -1.23516845703125, -1.170013427734375, -1.1048583984375, -1.039703369140625, -0.97454833984375, -0.909393310546875, -0.84423828125, -0.779083251953125, -0.71392822265625, -0.648773193359375, -0.5836181640625, -0.518463134765625, -0.45330810546875, -0.388153076171875, -0.322998046875, -0.257843017578125, -0.19268798828125, -0.127532958984375, -0.0623779296875, 0.002777099609375, 0.06793212890625, 0.133087158203125, 0.1982421875, 0.263397216796875, 0.32855224609375, 0.393707275390625, 0.4588623046875, 0.524017333984375, 0.58917236328125, 0.654327392578125, 0.719482421875, 0.784637451171875, 0.84979248046875, 0.914947509765625, 0.9801025390625, 1.045257568359375, 1.11041259765625, 1.175567626953125, 1.24072265625, 1.305877685546875, 1.37103271484375, 1.436187744140625, 1.5013427734375, 1.566497802734375, 1.63165283203125, 1.696807861328125, 1.761962890625, 1.827117919921875, 1.89227294921875, 1.957427978515625, 2.0225830078125, 2.087738037109375, 2.15289306640625, 2.218048095703125, 2.283203125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 28.0, 40.0, 51.0, 109.0, 144.0, 200.0, 320.0, 452.0, 694.0, 942.0, 1425.0, 2012.0, 3074.0, 4442.0, 6586.0, 10091.0, 15605.0, 24442.0, 40073.0, 69895.0, 134757.0, 296781.0, 199650.0, 95370.0, 52828.0, 31236.0, 19591.0, 12445.0, 8223.0, 5515.0, 3688.0, 2412.0, 1752.0, 1139.0, 781.0, 555.0, 342.0, 281.0, 172.0, 112.0, 86.0, 64.0, 33.0, 28.0, 11.0, 11.0, 9.0, 8.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.41845703125, -0.40605926513671875, -0.3936614990234375, -0.38126373291015625, -0.368865966796875, -0.35646820068359375, -0.3440704345703125, -0.33167266845703125, -0.31927490234375, -0.30687713623046875, -0.2944793701171875, -0.28208160400390625, -0.269683837890625, -0.25728607177734375, -0.2448883056640625, -0.23249053955078125, -0.2200927734375, -0.20769500732421875, -0.1952972412109375, -0.18289947509765625, -0.170501708984375, -0.15810394287109375, -0.1457061767578125, -0.13330841064453125, -0.12091064453125, -0.10851287841796875, -0.0961151123046875, -0.08371734619140625, -0.071319580078125, -0.05892181396484375, -0.0465240478515625, -0.03412628173828125, -0.021728515625, -0.00933074951171875, 0.0030670166015625, 0.01546478271484375, 0.027862548828125, 0.04026031494140625, 0.0526580810546875, 0.06505584716796875, 0.07745361328125, 0.08985137939453125, 0.1022491455078125, 0.11464691162109375, 0.127044677734375, 0.13944244384765625, 0.1518402099609375, 0.16423797607421875, 0.1766357421875, 0.18903350830078125, 0.2014312744140625, 0.21382904052734375, 0.226226806640625, 0.23862457275390625, 0.2510223388671875, 0.26342010498046875, 0.27581787109375, 0.28821563720703125, 0.3006134033203125, 0.31301116943359375, 0.325408935546875, 0.33780670166015625, 0.3502044677734375, 0.36260223388671875, 0.375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 4.0, 17.0, 13.0, 17.0, 16.0, 15.0, 16.0, 24.0, 43.0, 33.0, 30.0, 30.0, 37.0, 31.0, 43.0, 45.0, 39.0, 1064.0, 31.0, 45.0, 33.0, 38.0, 57.0, 27.0, 40.0, 30.0, 31.0, 27.0, 20.0, 24.0, 14.0, 11.0, 21.0, 6.0, 7.0, 6.0, 11.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2742919921875, -1.230224609375, -1.1861572265625, -1.14208984375, -1.0980224609375, -1.053955078125, -1.0098876953125, -0.9658203125, -0.9217529296875, -0.877685546875, -0.8336181640625, -0.78955078125, -0.7454833984375, -0.701416015625, -0.6573486328125, -0.61328125, -0.5692138671875, -0.525146484375, -0.4810791015625, -0.43701171875, -0.3929443359375, -0.348876953125, -0.3048095703125, -0.2607421875, -0.2166748046875, -0.172607421875, -0.1285400390625, -0.08447265625, -0.0404052734375, 0.003662109375, 0.0477294921875, 0.091796875, 0.1358642578125, 0.179931640625, 0.2239990234375, 0.26806640625, 0.3121337890625, 0.356201171875, 0.4002685546875, 0.4443359375, 0.4884033203125, 0.532470703125, 0.5765380859375, 0.62060546875, 0.6646728515625, 0.708740234375, 0.7528076171875, 0.796875, 0.8409423828125, 0.885009765625, 0.9290771484375, 0.97314453125, 1.0172119140625, 1.061279296875, 1.1053466796875, 1.1494140625, 1.1934814453125, 1.237548828125, 1.2816162109375, 1.32568359375, 1.3697509765625, 1.413818359375, 1.4578857421875, 1.501953125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 14.0, 19.0, 26.0, 32.0, 55.0, 75.0, 117.0, 163.0, 267.0, 330.0, 553.0, 757.0, 1044.0, 1630.0, 2485.0, 3699.0, 5658.0, 8495.0, 13580.0, 21556.0, 35388.0, 60776.0, 109978.0, 229462.0, 1309848.0, 120548.0, 66201.0, 38956.0, 23437.0, 14610.0, 9330.0, 5975.0, 3916.0, 2671.0, 1770.0, 1231.0, 813.0, 520.0, 361.0, 255.0, 164.0, 117.0, 82.0, 60.0, 33.0, 28.0, 12.0, 11.0, 11.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3490791320800781, -0.33707427978515625, -0.3250694274902344, -0.3130645751953125, -0.3010597229003906, -0.28905487060546875, -0.2770500183105469, -0.265045166015625, -0.2530403137207031, -0.24103546142578125, -0.22903060913085938, -0.2170257568359375, -0.20502090454101562, -0.19301605224609375, -0.18101119995117188, -0.16900634765625, -0.15700149536132812, -0.14499664306640625, -0.13299179077148438, -0.1209869384765625, -0.10898208618164062, -0.09697723388671875, -0.08497238159179688, -0.072967529296875, -0.060962677001953125, -0.04895782470703125, -0.036952972412109375, -0.0249481201171875, -0.012943267822265625, -0.00093841552734375, 0.011066436767578125, 0.0230712890625, 0.035076141357421875, 0.04708099365234375, 0.059085845947265625, 0.0710906982421875, 0.08309555053710938, 0.09510040283203125, 0.10710525512695312, 0.119110107421875, 0.13111495971679688, 0.14311981201171875, 0.15512466430664062, 0.1671295166015625, 0.17913436889648438, 0.19113922119140625, 0.20314407348632812, 0.21514892578125, 0.22715377807617188, 0.23915863037109375, 0.2511634826660156, 0.2631683349609375, 0.2751731872558594, 0.28717803955078125, 0.2991828918457031, 0.311187744140625, 0.3231925964355469, 0.33519744873046875, 0.3472023010253906, 0.3592071533203125, 0.3712120056152344, 0.38321685791015625, 0.3952217102050781, 0.4072265625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 6.0, 7.0, 15.0, 21.0, 23.0, 24.0, 23.0, 21.0, 30.0, 39.0, 45.0, 46.0, 49.0, 56.0, 55.0, 71.0, 44.0, 59.0, 42.0, 36.0, 42.0, 33.0, 30.0, 22.0, 25.0, 21.0, 16.0, 15.0, 14.0, 7.0, 8.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.00023508071899414062, -0.00022794120013713837, -0.0002208016812801361, -0.00021366216242313385, -0.0002065226435661316, -0.00019938312470912933, -0.00019224360585212708, -0.00018510408699512482, -0.00017796456813812256, -0.0001708250492811203, -0.00016368553042411804, -0.00015654601156711578, -0.00014940649271011353, -0.00014226697385311127, -0.000135127454996109, -0.00012798793613910675, -0.00012084841728210449, -0.00011370889842510223, -0.00010656937956809998, -9.942986071109772e-05, -9.229034185409546e-05, -8.51508229970932e-05, -7.801130414009094e-05, -7.087178528308868e-05, -6.373226642608643e-05, -5.659274756908417e-05, -4.945322871208191e-05, -4.231370985507965e-05, -3.517419099807739e-05, -2.8034672141075134e-05, -2.0895153284072876e-05, -1.3755634427070618e-05, -6.616115570068359e-06, 5.234032869338989e-07, 7.662922143936157e-06, 1.4802441000938416e-05, 2.1941959857940674e-05, 2.9081478714942932e-05, 3.622099757194519e-05, 4.336051642894745e-05, 5.050003528594971e-05, 5.7639554142951965e-05, 6.477907299995422e-05, 7.191859185695648e-05, 7.905811071395874e-05, 8.6197629570961e-05, 9.333714842796326e-05, 0.00010047666728496552, 0.00010761618614196777, 0.00011475570499897003, 0.00012189522385597229, 0.00012903474271297455, 0.0001361742615699768, 0.00014331378042697906, 0.00015045329928398132, 0.00015759281814098358, 0.00016473233699798584, 0.0001718718558549881, 0.00017901137471199036, 0.00018615089356899261, 0.00019329041242599487, 0.00020042993128299713, 0.0002075694501399994, 0.00021470896899700165, 0.0002218484878540039]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 7.0, 16.0, 12.0, 25.0, 19.0, 28.0, 41.0, 52.0, 81.0, 99.0, 133.0, 224.0, 350.0, 603.0, 1453.0, 307681.0, 733709.0, 2137.0, 673.0, 385.0, 247.0, 172.0, 106.0, 68.0, 57.0, 46.0, 35.0, 22.0, 13.0, 10.0, 11.0, 12.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004329681396484375, -0.004185795783996582, -0.004041910171508789, -0.003898024559020996, -0.003754138946533203, -0.00361025333404541, -0.003466367721557617, -0.0033224821090698242, -0.0031785964965820312, -0.0030347108840942383, -0.0028908252716064453, -0.0027469396591186523, -0.0026030540466308594, -0.0024591684341430664, -0.0023152828216552734, -0.0021713972091674805, -0.0020275115966796875, -0.0018836259841918945, -0.0017397403717041016, -0.0015958547592163086, -0.0014519691467285156, -0.0013080835342407227, -0.0011641979217529297, -0.0010203123092651367, -0.0008764266967773438, -0.0007325410842895508, -0.0005886554718017578, -0.00044476985931396484, -0.0003008842468261719, -0.0001569986343383789, -1.3113021850585938e-05, 0.00013077259063720703, 0.000274658203125, 0.00041854381561279297, 0.0005624294281005859, 0.0007063150405883789, 0.0008502006530761719, 0.0009940862655639648, 0.0011379718780517578, 0.0012818574905395508, 0.0014257431030273438, 0.0015696287155151367, 0.0017135143280029297, 0.0018573999404907227, 0.0020012855529785156, 0.0021451711654663086, 0.0022890567779541016, 0.0024329423904418945, 0.0025768280029296875, 0.0027207136154174805, 0.0028645992279052734, 0.0030084848403930664, 0.0031523704528808594, 0.0032962560653686523, 0.0034401416778564453, 0.0035840272903442383, 0.0037279129028320312, 0.0038717985153198242, 0.004015684127807617, 0.00415956974029541, 0.004303455352783203, 0.004447340965270996, 0.004591226577758789, 0.004735112190246582, 0.004878997802734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 29.0, 69.0, 129.0, 166.0, 217.0, 169.0, 114.0, 68.0, 24.0, 14.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002702518249861896, -0.00026107270969077945, -0.0002518935943953693, -0.00024271449365187436, -0.00023353539290837944, -0.00022435627761296928, -0.00021517716231755912, -0.00020599804702214897, -0.00019681894627865404, -0.00018763983098324388, -0.00017846073023974895, -0.0001692816149443388, -0.00016010249964892864, -0.00015092339890543371, -0.00014174428361002356, -0.00013256518286652863, -0.00012338606757111847, -0.00011420695955166593, -0.00010502785153221339, -9.584873623680323e-05, -8.666962821735069e-05, -7.749052019789815e-05, -6.8311404902488e-05, -5.913229688303545e-05, -4.995318886358291e-05, -4.077408084413037e-05, -3.159496918669902e-05, -2.2415859348257072e-05, -1.3236749509815127e-05, -4.057641490362585e-06, 5.1214701670687646e-06, 1.4300581824500114e-05, 2.3479689843952656e-05, 3.26587978634052e-05, 4.183790952083655e-05, 5.1017021178267896e-05, 6.019612919772044e-05, 6.937523721717298e-05, 7.855435251258314e-05, 8.773346053203568e-05, 9.691256855148822e-05, 0.00010609167657094076, 0.0001152707845903933, 0.00012444989988580346, 0.00013362901518121362, 0.00014280811592470855, 0.0001519872312201187, 0.00016116633196361363, 0.00017034544725902379, 0.00017952456255443394, 0.00018870366329792887, 0.00019788277859333903, 0.00020706187933683395, 0.0002162409946322441, 0.00022542010992765427, 0.00023459922522306442, 0.00024377832596655935, 0.0002529574267100543, 0.00026213654200546443, 0.0002713156573008746, 0.00028049477259628475, 0.00028967385878786445, 0.0002988529740832746, 0.00030803208937868476, 0.0003172112046740949]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 8.0, 3.0, 4.0, 13.0, 5.0, 7.0, 14.0, 21.0, 26.0, 8.0, 19.0, 20.0, 27.0, 19.0, 32.0, 21.0, 28.0, 21.0, 37.0, 42.0, 34.0, 35.0, 39.0, 40.0, 35.0, 32.0, 32.0, 42.0, 37.0, 34.0, 22.0, 27.0, 27.0, 10.0, 23.0, 21.0, 19.0, 21.0, 15.0, 8.0, 11.0, 15.0, 11.0, 4.0, 3.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011897087097167969, -0.0001154458150267601, -0.00011192075908184052, -0.00010839570313692093, -0.00010487064719200134, -0.00010134559124708176, -9.782053530216217e-05, -9.429547935724258e-05, -9.0770423412323e-05, -8.724536746740341e-05, -8.372031152248383e-05, -8.019525557756424e-05, -7.667019963264465e-05, -7.314514368772507e-05, -6.962008774280548e-05, -6.60950317978859e-05, -6.256997585296631e-05, -5.904491990804672e-05, -5.5519863963127136e-05, -5.199480801820755e-05, -4.8469752073287964e-05, -4.494469612836838e-05, -4.141964018344879e-05, -3.7894584238529205e-05, -3.436952829360962e-05, -3.084447234869003e-05, -2.7319416403770447e-05, -2.379436045885086e-05, -2.0269304513931274e-05, -1.6744248569011688e-05, -1.3219192624092102e-05, -9.694136679172516e-06, -6.16908073425293e-06, -2.6440247893333435e-06, 8.810311555862427e-07, 4.406087100505829e-06, 7.931143045425415e-06, 1.1456198990345001e-05, 1.4981254935264587e-05, 1.8506310880184174e-05, 2.203136682510376e-05, 2.5556422770023346e-05, 2.9081478714942932e-05, 3.260653465986252e-05, 3.6131590604782104e-05, 3.965664654970169e-05, 4.318170249462128e-05, 4.670675843954086e-05, 5.023181438446045e-05, 5.3756870329380035e-05, 5.728192627429962e-05, 6.080698221921921e-05, 6.43320381641388e-05, 6.785709410905838e-05, 7.138215005397797e-05, 7.490720599889755e-05, 7.843226194381714e-05, 8.195731788873672e-05, 8.548237383365631e-05, 8.90074297785759e-05, 9.253248572349548e-05, 9.605754166841507e-05, 9.958259761333466e-05, 0.00010310765355825424, 0.00010663270950317383]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 11.0, 10.0, 6.0, 5.0, 16.0, 13.0, 16.0, 17.0, 19.0, 24.0, 20.0, 24.0, 34.0, 32.0, 37.0, 44.0, 30.0, 29.0, 40.0, 53.0, 49.0, 33.0, 31.0, 62.0, 40.0, 31.0, 32.0, 34.0, 34.0, 19.0, 24.0, 21.0, 19.0, 16.0, 13.0, 11.0, 7.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.821563720703125, -1.75640869140625, -1.691253662109375, -1.6260986328125, -1.560943603515625, -1.49578857421875, -1.430633544921875, -1.365478515625, -1.300323486328125, -1.23516845703125, -1.170013427734375, -1.1048583984375, -1.039703369140625, -0.97454833984375, -0.909393310546875, -0.84423828125, -0.779083251953125, -0.71392822265625, -0.648773193359375, -0.5836181640625, -0.518463134765625, -0.45330810546875, -0.388153076171875, -0.322998046875, -0.257843017578125, -0.19268798828125, -0.127532958984375, -0.0623779296875, 0.002777099609375, 0.06793212890625, 0.133087158203125, 0.1982421875, 0.263397216796875, 0.32855224609375, 0.393707275390625, 0.4588623046875, 0.524017333984375, 0.58917236328125, 0.654327392578125, 0.719482421875, 0.784637451171875, 0.84979248046875, 0.914947509765625, 0.9801025390625, 1.045257568359375, 1.11041259765625, 1.175567626953125, 1.24072265625, 1.305877685546875, 1.37103271484375, 1.436187744140625, 1.5013427734375, 1.566497802734375, 1.63165283203125, 1.696807861328125, 1.761962890625, 1.827117919921875, 1.89227294921875, 1.957427978515625, 2.0225830078125, 2.087738037109375, 2.15289306640625, 2.218048095703125, 2.283203125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 6.0, 16.0, 12.0, 12.0, 19.0, 32.0, 58.0, 77.0, 110.0, 184.0, 276.0, 443.0, 773.0, 1291.0, 2583.0, 4604.0, 8163.0, 14784.0, 26778.0, 48868.0, 97813.0, 218782.0, 302176.0, 160426.0, 73923.0, 38330.0, 21185.0, 11916.0, 6485.0, 3614.0, 1970.0, 1077.0, 633.0, 382.0, 229.0, 151.0, 112.0, 64.0, 45.0, 36.0, 28.0, 15.0, 17.0, 14.0, 4.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.7490234375, -1.69488525390625, -1.6407470703125, -1.58660888671875, -1.532470703125, -1.47833251953125, -1.4241943359375, -1.37005615234375, -1.31591796875, -1.26177978515625, -1.2076416015625, -1.15350341796875, -1.099365234375, -1.04522705078125, -0.9910888671875, -0.93695068359375, -0.8828125, -0.82867431640625, -0.7745361328125, -0.72039794921875, -0.666259765625, -0.61212158203125, -0.5579833984375, -0.50384521484375, -0.44970703125, -0.39556884765625, -0.3414306640625, -0.28729248046875, -0.233154296875, -0.17901611328125, -0.1248779296875, -0.07073974609375, -0.0166015625, 0.03753662109375, 0.0916748046875, 0.14581298828125, 0.199951171875, 0.25408935546875, 0.3082275390625, 0.36236572265625, 0.41650390625, 0.47064208984375, 0.5247802734375, 0.57891845703125, 0.633056640625, 0.68719482421875, 0.7413330078125, 0.79547119140625, 0.849609375, 0.90374755859375, 0.9578857421875, 1.01202392578125, 1.066162109375, 1.12030029296875, 1.1744384765625, 1.22857666015625, 1.28271484375, 1.33685302734375, 1.3909912109375, 1.44512939453125, 1.499267578125, 1.55340576171875, 1.6075439453125, 1.66168212890625, 1.7158203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 9.0, 6.0, 7.0, 15.0, 16.0, 13.0, 19.0, 19.0, 24.0, 22.0, 32.0, 41.0, 39.0, 35.0, 41.0, 55.0, 65.0, 147.0, 363.0, 1406.0, 174.0, 69.0, 52.0, 48.0, 38.0, 41.0, 39.0, 26.0, 26.0, 21.0, 22.0, 20.0, 16.0, 13.0, 11.0, 8.0, 9.0, 9.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.7578125, -8.50787353515625, -8.2579345703125, -8.00799560546875, -7.758056640625, -7.50811767578125, -7.2581787109375, -7.00823974609375, -6.75830078125, -6.50836181640625, -6.2584228515625, -6.00848388671875, -5.758544921875, -5.50860595703125, -5.2586669921875, -5.00872802734375, -4.7587890625, -4.50885009765625, -4.2589111328125, -4.00897216796875, -3.759033203125, -3.50909423828125, -3.2591552734375, -3.00921630859375, -2.75927734375, -2.50933837890625, -2.2593994140625, -2.00946044921875, -1.759521484375, -1.50958251953125, -1.2596435546875, -1.00970458984375, -0.759765625, -0.50982666015625, -0.2598876953125, -0.00994873046875, 0.239990234375, 0.48992919921875, 0.7398681640625, 0.98980712890625, 1.23974609375, 1.48968505859375, 1.7396240234375, 1.98956298828125, 2.239501953125, 2.48944091796875, 2.7393798828125, 2.98931884765625, 3.2392578125, 3.48919677734375, 3.7391357421875, 3.98907470703125, 4.239013671875, 4.48895263671875, 4.7388916015625, 4.98883056640625, 5.23876953125, 5.48870849609375, 5.7386474609375, 5.98858642578125, 6.238525390625, 6.48846435546875, 6.7384033203125, 6.98834228515625, 7.23828125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 8.0, 10.0, 5.0, 13.0, 13.0, 15.0, 17.0, 28.0, 33.0, 45.0, 69.0, 83.0, 125.0, 227.0, 397.0, 922.0, 11733.0, 3095074.0, 34483.0, 1208.0, 427.0, 229.0, 148.0, 87.0, 74.0, 44.0, 32.0, 29.0, 34.0, 14.0, 13.0, 8.0, 5.0, 9.0, 7.0, 4.0, 5.0, 3.0, 5.0, 0.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.59375, -27.716552734375, -26.83935546875, -25.962158203125, -25.0849609375, -24.207763671875, -23.33056640625, -22.453369140625, -21.576171875, -20.698974609375, -19.82177734375, -18.944580078125, -18.0673828125, -17.190185546875, -16.31298828125, -15.435791015625, -14.55859375, -13.681396484375, -12.80419921875, -11.927001953125, -11.0498046875, -10.172607421875, -9.29541015625, -8.418212890625, -7.541015625, -6.663818359375, -5.78662109375, -4.909423828125, -4.0322265625, -3.155029296875, -2.27783203125, -1.400634765625, -0.5234375, 0.353759765625, 1.23095703125, 2.108154296875, 2.9853515625, 3.862548828125, 4.73974609375, 5.616943359375, 6.494140625, 7.371337890625, 8.24853515625, 9.125732421875, 10.0029296875, 10.880126953125, 11.75732421875, 12.634521484375, 13.51171875, 14.388916015625, 15.26611328125, 16.143310546875, 17.0205078125, 17.897705078125, 18.77490234375, 19.652099609375, 20.529296875, 21.406494140625, 22.28369140625, 23.160888671875, 24.0380859375, 24.915283203125, 25.79248046875, 26.669677734375, 27.546875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 25.0, 33.0, 60.0, 99.0, 115.0, 149.0, 142.0, 133.0, 91.0, 72.0, 38.0, 16.0, 8.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.52664566040039, -14.085351943969727, -13.644058227539062, -13.202764511108398, -12.761470794677734, -12.32017707824707, -11.878883361816406, -11.437589645385742, -10.996295928955078, -10.555002212524414, -10.11370849609375, -9.672414779663086, -9.231121063232422, -8.789827346801758, -8.348533630371094, -7.9072394371032715, -7.465945243835449, -7.024651527404785, -6.583357810974121, -6.142064094543457, -5.700770378112793, -5.259476661682129, -4.818182468414307, -4.376888751983643, -3.9355950355529785, -3.4943013191223145, -3.0530076026916504, -2.6117136478424072, -2.170419931411743, -1.729126214981079, -1.287832260131836, -0.8465385437011719, -0.4052457809448242, 0.03604799509048462, 0.47734177112579346, 0.9186356067657471, 1.3599293231964111, 1.8012230396270752, 2.2425169944763184, 2.6838107109069824, 3.1251044273376465, 3.5663981437683105, 4.007691860198975, 4.448986053466797, 4.890279769897461, 5.331573486328125, 5.772867202758789, 6.214160919189453, 6.655454635620117, 7.096748352050781, 7.538042068481445, 7.979335784912109, 8.420629501342773, 8.861923217773438, 9.303216934204102, 9.744510650634766, 10.18580436706543, 10.627098083496094, 11.068391799926758, 11.509685516357422, 11.950979232788086, 12.39227294921875, 12.833566665649414, 13.274860382080078, 13.716155052185059]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 15.0, 10.0, 7.0, 22.0, 23.0, 19.0, 22.0, 24.0, 34.0, 23.0, 30.0, 32.0, 33.0, 26.0, 39.0, 35.0, 41.0, 36.0, 36.0, 38.0, 35.0, 31.0, 34.0, 30.0, 36.0, 34.0, 24.0, 29.0, 24.0, 21.0, 27.0, 26.0, 25.0, 9.0, 9.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.539243698120117, -21.860074996948242, -21.180908203125, -20.501739501953125, -19.82257080078125, -19.143402099609375, -18.4642333984375, -17.785066604614258, -17.105897903442383, -16.426729202270508, -15.74756145477295, -15.06839370727539, -14.389225006103516, -13.71005630493164, -13.030888557434082, -12.351720809936523, -11.672552108764648, -10.993383407592773, -10.314215660095215, -9.635047912597656, -8.955879211425781, -8.276710510253906, -7.597542762756348, -6.918374538421631, -6.239206314086914, -5.560038089752197, -4.8808698654174805, -4.201701641082764, -3.522533416748047, -2.84336519241333, -2.1641969680786133, -1.4850287437438965, -0.8058586120605469, -0.12669038772583008, 0.5524778366088867, 1.2316460609436035, 1.9108142852783203, 2.589982509613037, 3.269150733947754, 3.9483189582824707, 4.6274871826171875, 5.306655406951904, 5.985823631286621, 6.664991855621338, 7.344160079956055, 8.02332878112793, 8.702496528625488, 9.381664276123047, 10.060832977294922, 10.740001678466797, 11.419169425964355, 12.098337173461914, 12.777505874633789, 13.456674575805664, 14.135842323303223, 14.815010070800781, 15.494178771972656, 16.17334747314453, 16.852516174316406, 17.53168296813965, 18.210851669311523, 18.8900203704834, 19.56918716430664, 20.248355865478516, 20.92752456665039]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 12.0, 12.0, 9.0, 10.0, 14.0, 15.0, 16.0, 22.0, 21.0, 19.0, 28.0, 33.0, 25.0, 38.0, 33.0, 30.0, 45.0, 38.0, 46.0, 30.0, 43.0, 38.0, 50.0, 48.0, 40.0, 35.0, 25.0, 32.0, 29.0, 18.0, 17.0, 17.0, 16.0, 17.0, 13.0, 6.0, 12.0, 7.0, 8.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9931640625, -1.9227142333984375, -1.852264404296875, -1.7818145751953125, -1.71136474609375, -1.6409149169921875, -1.570465087890625, -1.5000152587890625, -1.4295654296875, -1.3591156005859375, -1.288665771484375, -1.2182159423828125, -1.14776611328125, -1.0773162841796875, -1.006866455078125, -0.9364166259765625, -0.865966796875, -0.7955169677734375, -0.725067138671875, -0.6546173095703125, -0.58416748046875, -0.5137176513671875, -0.443267822265625, -0.3728179931640625, -0.3023681640625, -0.2319183349609375, -0.161468505859375, -0.0910186767578125, -0.02056884765625, 0.0498809814453125, 0.120330810546875, 0.1907806396484375, 0.26123046875, 0.3316802978515625, 0.402130126953125, 0.4725799560546875, 0.54302978515625, 0.6134796142578125, 0.683929443359375, 0.7543792724609375, 0.8248291015625, 0.8952789306640625, 0.965728759765625, 1.0361785888671875, 1.10662841796875, 1.1770782470703125, 1.247528076171875, 1.3179779052734375, 1.388427734375, 1.4588775634765625, 1.529327392578125, 1.5997772216796875, 1.67022705078125, 1.7406768798828125, 1.811126708984375, 1.8815765380859375, 1.9520263671875, 2.0224761962890625, 2.092926025390625, 2.1633758544921875, 2.23382568359375, 2.3042755126953125, 2.374725341796875, 2.4451751708984375, 2.515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 16.0, 15.0, 14.0, 23.0, 21.0, 37.0, 48.0, 95.0, 152.0, 236.0, 398.0, 991.0, 2955.0, 13246.0, 90253.0, 644746.0, 2020426.0, 1185892.0, 200123.0, 26597.0, 5053.0, 1457.0, 618.0, 296.0, 173.0, 119.0, 89.0, 54.0, 38.0, 18.0, 17.0, 18.0, 7.0, 12.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.40625, -4.271484375, -4.13671875, -4.001953125, -3.8671875, -3.732421875, -3.59765625, -3.462890625, -3.328125, -3.193359375, -3.05859375, -2.923828125, -2.7890625, -2.654296875, -2.51953125, -2.384765625, -2.25, -2.115234375, -1.98046875, -1.845703125, -1.7109375, -1.576171875, -1.44140625, -1.306640625, -1.171875, -1.037109375, -0.90234375, -0.767578125, -0.6328125, -0.498046875, -0.36328125, -0.228515625, -0.09375, 0.041015625, 0.17578125, 0.310546875, 0.4453125, 0.580078125, 0.71484375, 0.849609375, 0.984375, 1.119140625, 1.25390625, 1.388671875, 1.5234375, 1.658203125, 1.79296875, 1.927734375, 2.0625, 2.197265625, 2.33203125, 2.466796875, 2.6015625, 2.736328125, 2.87109375, 3.005859375, 3.140625, 3.275390625, 3.41015625, 3.544921875, 3.6796875, 3.814453125, 3.94921875, 4.083984375, 4.21875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 10.0, 13.0, 16.0, 28.0, 54.0, 58.0, 91.0, 162.0, 232.0, 310.0, 431.0, 513.0, 535.0, 490.0, 369.0, 271.0, 171.0, 109.0, 66.0, 61.0, 26.0, 24.0, 15.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -5.99774169921875, -5.7767333984375, -5.55572509765625, -5.334716796875, -5.11370849609375, -4.8927001953125, -4.67169189453125, -4.45068359375, -4.22967529296875, -4.0086669921875, -3.78765869140625, -3.566650390625, -3.34564208984375, -3.1246337890625, -2.90362548828125, -2.6826171875, -2.46160888671875, -2.2406005859375, -2.01959228515625, -1.798583984375, -1.57757568359375, -1.3565673828125, -1.13555908203125, -0.91455078125, -0.69354248046875, -0.4725341796875, -0.25152587890625, -0.030517578125, 0.19049072265625, 0.4114990234375, 0.63250732421875, 0.853515625, 1.07452392578125, 1.2955322265625, 1.51654052734375, 1.737548828125, 1.95855712890625, 2.1795654296875, 2.40057373046875, 2.62158203125, 2.84259033203125, 3.0635986328125, 3.28460693359375, 3.505615234375, 3.72662353515625, 3.9476318359375, 4.16864013671875, 4.3896484375, 4.61065673828125, 4.8316650390625, 5.05267333984375, 5.273681640625, 5.49468994140625, 5.7156982421875, 5.93670654296875, 6.15771484375, 6.37872314453125, 6.5997314453125, 6.82073974609375, 7.041748046875, 7.26275634765625, 7.4837646484375, 7.70477294921875, 7.92578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 7.0, 9.0, 17.0, 16.0, 30.0, 41.0, 75.0, 72.0, 124.0, 165.0, 284.0, 550.0, 1624.0, 16959.0, 1029131.0, 3072042.0, 68404.0, 2931.0, 776.0, 362.0, 191.0, 128.0, 82.0, 78.0, 55.0, 43.0, 29.0, 17.0, 11.0, 7.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.21875, -14.7735595703125, -14.328369140625, -13.8831787109375, -13.43798828125, -12.9927978515625, -12.547607421875, -12.1024169921875, -11.6572265625, -11.2120361328125, -10.766845703125, -10.3216552734375, -9.87646484375, -9.4312744140625, -8.986083984375, -8.5408935546875, -8.095703125, -7.6505126953125, -7.205322265625, -6.7601318359375, -6.31494140625, -5.8697509765625, -5.424560546875, -4.9793701171875, -4.5341796875, -4.0889892578125, -3.643798828125, -3.1986083984375, -2.75341796875, -2.3082275390625, -1.863037109375, -1.4178466796875, -0.97265625, -0.5274658203125, -0.082275390625, 0.3629150390625, 0.80810546875, 1.2532958984375, 1.698486328125, 2.1436767578125, 2.5888671875, 3.0340576171875, 3.479248046875, 3.9244384765625, 4.36962890625, 4.8148193359375, 5.260009765625, 5.7052001953125, 6.150390625, 6.5955810546875, 7.040771484375, 7.4859619140625, 7.93115234375, 8.3763427734375, 8.821533203125, 9.2667236328125, 9.7119140625, 10.1571044921875, 10.602294921875, 11.0474853515625, 11.49267578125, 11.9378662109375, 12.383056640625, 12.8282470703125, 13.2734375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 17.0, 26.0, 71.0, 124.0, 202.0, 229.0, 168.0, 88.0, 57.0, 21.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.436946868896484, -42.96480178833008, -41.49265670776367, -40.0205078125, -38.548362731933594, -37.07621765136719, -35.60407257080078, -34.131927490234375, -32.65978240966797, -31.187637329101562, -29.715490341186523, -28.243345260620117, -26.77120018005371, -25.299053192138672, -23.826908111572266, -22.35476303100586, -20.88261604309082, -19.410470962524414, -17.938323974609375, -16.46617889404297, -14.994033813476562, -13.52188777923584, -12.049741744995117, -10.577596664428711, -9.105450630187988, -7.633305072784424, -6.161159515380859, -4.689013481140137, -3.2168679237365723, -1.7447223663330078, -0.27257633209228516, 1.199568748474121, 2.6717147827148438, 4.143860340118408, 5.616005897521973, 7.088151931762695, 8.560297012329102, 10.032443046569824, 11.504589080810547, 12.976734161376953, 14.448880195617676, 15.921026229858398, 17.393171310424805, 18.865318298339844, 20.33746337890625, 21.809608459472656, 23.281753540039062, 24.75389862060547, 26.226045608520508, 27.698190689086914, 29.170337677001953, 30.64248275756836, 32.114627838134766, 33.58677291870117, 35.058921813964844, 36.53106689453125, 38.003211975097656, 39.47535705566406, 40.94750213623047, 42.419647216796875, 43.89179611206055, 45.36394119262695, 46.83608627319336, 48.308231353759766, 49.78037643432617]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 7.0, 8.0, 5.0, 11.0, 14.0, 15.0, 12.0, 16.0, 20.0, 24.0, 29.0, 25.0, 31.0, 34.0, 44.0, 38.0, 32.0, 24.0, 33.0, 38.0, 33.0, 42.0, 45.0, 39.0, 25.0, 43.0, 35.0, 30.0, 32.0, 23.0, 32.0, 19.0, 14.0, 12.0, 15.0, 17.0, 14.0, 17.0, 12.0, 10.0, 5.0, 7.0, 6.0, 1.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.432432174682617, -15.915843963623047, -15.399256706237793, -14.882668495178223, -14.366081237792969, -13.849493026733398, -13.332904815673828, -12.816316604614258, -12.299729347229004, -11.783141136169434, -11.26655387878418, -10.74996566772461, -10.233377456665039, -9.716790199279785, -9.200201988220215, -8.683614730834961, -8.16702651977539, -7.6504387855529785, -7.133851051330566, -6.617262840270996, -6.100675106048584, -5.584087371826172, -5.067499160766602, -4.5509114265441895, -4.034323692321777, -3.5177359580993652, -3.001147985458374, -2.484560012817383, -1.9679722785949707, -1.4513845443725586, -0.9347965717315674, -0.41820859909057617, 0.09837722778320312, 0.6149650812149048, 1.1315529346466064, 1.648140788078308, 2.1647286415100098, 2.681316375732422, 3.197904348373413, 3.7144923210144043, 4.231080055236816, 4.7476677894592285, 5.264255523681641, 5.780843734741211, 6.297431468963623, 6.814019203186035, 7.3306074142456055, 7.847195148468018, 8.36378288269043, 8.88037109375, 9.396958351135254, 9.913546562194824, 10.430133819580078, 10.946722030639648, 11.463310241699219, 11.979898452758789, 12.496485710144043, 13.013073921203613, 13.529661178588867, 14.046249389648438, 14.562837600708008, 15.079424858093262, 15.596013069152832, 16.112600326538086, 16.629188537597656]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 13.0, 17.0, 11.0, 21.0, 11.0, 19.0, 21.0, 24.0, 23.0, 29.0, 38.0, 31.0, 40.0, 51.0, 42.0, 49.0, 41.0, 33.0, 44.0, 33.0, 46.0, 50.0, 25.0, 29.0, 32.0, 22.0, 22.0, 26.0, 16.0, 17.0, 15.0, 14.0, 10.0, 5.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0234375, -1.95208740234375, -1.8807373046875, -1.80938720703125, -1.738037109375, -1.66668701171875, -1.5953369140625, -1.52398681640625, -1.45263671875, -1.38128662109375, -1.3099365234375, -1.23858642578125, -1.167236328125, -1.09588623046875, -1.0245361328125, -0.95318603515625, -0.8818359375, -0.81048583984375, -0.7391357421875, -0.66778564453125, -0.596435546875, -0.52508544921875, -0.4537353515625, -0.38238525390625, -0.31103515625, -0.23968505859375, -0.1683349609375, -0.09698486328125, -0.025634765625, 0.04571533203125, 0.1170654296875, 0.18841552734375, 0.259765625, 0.33111572265625, 0.4024658203125, 0.47381591796875, 0.545166015625, 0.61651611328125, 0.6878662109375, 0.75921630859375, 0.83056640625, 0.90191650390625, 0.9732666015625, 1.04461669921875, 1.115966796875, 1.18731689453125, 1.2586669921875, 1.33001708984375, 1.4013671875, 1.47271728515625, 1.5440673828125, 1.61541748046875, 1.686767578125, 1.75811767578125, 1.8294677734375, 1.90081787109375, 1.97216796875, 2.04351806640625, 2.1148681640625, 2.18621826171875, 2.257568359375, 2.32891845703125, 2.4002685546875, 2.47161865234375, 2.54296875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 23.0, 30.0, 54.0, 62.0, 77.0, 136.0, 201.0, 294.0, 395.0, 549.0, 863.0, 1257.0, 1806.0, 2674.0, 3805.0, 5484.0, 8146.0, 11627.0, 17505.0, 26208.0, 40953.0, 68879.0, 124148.0, 260479.0, 206517.0, 101634.0, 57913.0, 35290.0, 22923.0, 15102.0, 10488.0, 7073.0, 4935.0, 3467.0, 2332.0, 1625.0, 1204.0, 747.0, 521.0, 325.0, 257.0, 194.0, 126.0, 72.0, 55.0, 37.0, 25.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.391845703125, -0.37953948974609375, -0.3672332763671875, -0.35492706298828125, -0.342620849609375, -0.33031463623046875, -0.3180084228515625, -0.30570220947265625, -0.29339599609375, -0.28108978271484375, -0.2687835693359375, -0.25647735595703125, -0.244171142578125, -0.23186492919921875, -0.2195587158203125, -0.20725250244140625, -0.1949462890625, -0.18264007568359375, -0.1703338623046875, -0.15802764892578125, -0.145721435546875, -0.13341522216796875, -0.1211090087890625, -0.10880279541015625, -0.09649658203125, -0.08419036865234375, -0.0718841552734375, -0.05957794189453125, -0.047271728515625, -0.03496551513671875, -0.0226593017578125, -0.01035308837890625, 0.001953125, 0.01425933837890625, 0.0265655517578125, 0.03887176513671875, 0.051177978515625, 0.06348419189453125, 0.0757904052734375, 0.08809661865234375, 0.10040283203125, 0.11270904541015625, 0.1250152587890625, 0.13732147216796875, 0.149627685546875, 0.16193389892578125, 0.1742401123046875, 0.18654632568359375, 0.1988525390625, 0.21115875244140625, 0.2234649658203125, 0.23577117919921875, 0.248077392578125, 0.26038360595703125, 0.2726898193359375, 0.28499603271484375, 0.29730224609375, 0.30960845947265625, 0.3219146728515625, 0.33422088623046875, 0.346527099609375, 0.35883331298828125, 0.3711395263671875, 0.38344573974609375, 0.395751953125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 18.0, 12.0, 15.0, 11.0, 20.0, 23.0, 22.0, 20.0, 27.0, 17.0, 30.0, 41.0, 34.0, 27.0, 28.0, 43.0, 38.0, 40.0, 1063.0, 42.0, 48.0, 27.0, 33.0, 29.0, 27.0, 30.0, 24.0, 33.0, 31.0, 18.0, 15.0, 17.0, 14.0, 11.0, 16.0, 12.0, 13.0, 10.0, 5.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-1.40234375, -1.3595123291015625, -1.316680908203125, -1.2738494873046875, -1.23101806640625, -1.1881866455078125, -1.145355224609375, -1.1025238037109375, -1.0596923828125, -1.0168609619140625, -0.974029541015625, -0.9311981201171875, -0.88836669921875, -0.8455352783203125, -0.802703857421875, -0.7598724365234375, -0.717041015625, -0.6742095947265625, -0.631378173828125, -0.5885467529296875, -0.54571533203125, -0.5028839111328125, -0.460052490234375, -0.4172210693359375, -0.3743896484375, -0.3315582275390625, -0.288726806640625, -0.2458953857421875, -0.20306396484375, -0.1602325439453125, -0.117401123046875, -0.0745697021484375, -0.03173828125, 0.0110931396484375, 0.053924560546875, 0.0967559814453125, 0.13958740234375, 0.1824188232421875, 0.225250244140625, 0.2680816650390625, 0.3109130859375, 0.3537445068359375, 0.396575927734375, 0.4394073486328125, 0.48223876953125, 0.5250701904296875, 0.567901611328125, 0.6107330322265625, 0.653564453125, 0.6963958740234375, 0.739227294921875, 0.7820587158203125, 0.82489013671875, 0.8677215576171875, 0.910552978515625, 0.9533843994140625, 0.9962158203125, 1.0390472412109375, 1.081878662109375, 1.1247100830078125, 1.16754150390625, 1.2103729248046875, 1.253204345703125, 1.2960357666015625, 1.3388671875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 1.0, 6.0, 7.0, 12.0, 15.0, 29.0, 38.0, 58.0, 78.0, 114.0, 180.0, 223.0, 338.0, 537.0, 650.0, 1030.0, 1518.0, 2065.0, 3145.0, 4553.0, 6539.0, 9904.0, 14499.0, 22395.0, 35776.0, 57815.0, 100816.0, 205360.0, 1316894.0, 123325.0, 68614.0, 41938.0, 26310.0, 16901.0, 11258.0, 7738.0, 5136.0, 3486.0, 2381.0, 1664.0, 1194.0, 796.0, 509.0, 439.0, 272.0, 199.0, 122.0, 104.0, 57.0, 30.0, 22.0, 21.0, 13.0, 6.0, 2.0, 8.0, 1.0, 1.0, 1.0], "bins": [-0.40380859375, -0.391632080078125, -0.37945556640625, -0.367279052734375, -0.3551025390625, -0.342926025390625, -0.33074951171875, -0.318572998046875, -0.306396484375, -0.294219970703125, -0.28204345703125, -0.269866943359375, -0.2576904296875, -0.245513916015625, -0.23333740234375, -0.221160888671875, -0.208984375, -0.196807861328125, -0.18463134765625, -0.172454833984375, -0.1602783203125, -0.148101806640625, -0.13592529296875, -0.123748779296875, -0.111572265625, -0.099395751953125, -0.08721923828125, -0.075042724609375, -0.0628662109375, -0.050689697265625, -0.03851318359375, -0.026336669921875, -0.01416015625, -0.001983642578125, 0.01019287109375, 0.022369384765625, 0.0345458984375, 0.046722412109375, 0.05889892578125, 0.071075439453125, 0.083251953125, 0.095428466796875, 0.10760498046875, 0.119781494140625, 0.1319580078125, 0.144134521484375, 0.15631103515625, 0.168487548828125, 0.1806640625, 0.192840576171875, 0.20501708984375, 0.217193603515625, 0.2293701171875, 0.241546630859375, 0.25372314453125, 0.265899658203125, 0.278076171875, 0.290252685546875, 0.30242919921875, 0.314605712890625, 0.3267822265625, 0.338958740234375, 0.35113525390625, 0.363311767578125, 0.37548828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 14.0, 13.0, 18.0, 26.0, 26.0, 34.0, 35.0, 58.0, 57.0, 65.0, 76.0, 74.0, 79.0, 64.0, 61.0, 51.0, 36.0, 36.0, 34.0, 23.0, 19.0, 22.0, 11.0, 11.0, 11.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031113624572753906, -0.00030126050114631653, -0.000291384756565094, -0.00028150901198387146, -0.0002716332674026489, -0.0002617575228214264, -0.00025188177824020386, -0.00024200603365898132, -0.0002321302890777588, -0.00022225454449653625, -0.00021237879991531372, -0.0002025030553340912, -0.00019262731075286865, -0.00018275156617164612, -0.00017287582159042358, -0.00016300007700920105, -0.00015312433242797852, -0.00014324858784675598, -0.00013337284326553345, -0.0001234970986843109, -0.00011362135410308838, -0.00010374560952186584, -9.386986494064331e-05, -8.399412035942078e-05, -7.411837577819824e-05, -6.424263119697571e-05, -5.4366886615753174e-05, -4.449114203453064e-05, -3.4615397453308105e-05, -2.473965287208557e-05, -1.4863908290863037e-05, -4.988163709640503e-06, 4.887580871582031e-06, 1.4763325452804565e-05, 2.46390700340271e-05, 3.4514814615249634e-05, 4.439055919647217e-05, 5.42663037776947e-05, 6.414204835891724e-05, 7.401779294013977e-05, 8.38935375213623e-05, 9.376928210258484e-05, 0.00010364502668380737, 0.00011352077126502991, 0.00012339651584625244, 0.00013327226042747498, 0.0001431480050086975, 0.00015302374958992004, 0.00016289949417114258, 0.0001727752387523651, 0.00018265098333358765, 0.00019252672791481018, 0.00020240247249603271, 0.00021227821707725525, 0.00022215396165847778, 0.00023202970623970032, 0.00024190545082092285, 0.0002517811954021454, 0.0002616569399833679, 0.00027153268456459045, 0.000281408429145813, 0.0002912841737270355, 0.00030115991830825806, 0.0003110356628894806, 0.0003209114074707031]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 9.0, 13.0, 12.0, 16.0, 39.0, 27.0, 65.0, 57.0, 87.0, 125.0, 213.0, 452.0, 1031.0, 49079.0, 993322.0, 2454.0, 617.0, 338.0, 212.0, 127.0, 71.0, 50.0, 35.0, 27.0, 14.0, 13.0, 13.0, 5.0, 6.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006374359130859375, -0.0061827898025512695, -0.005991220474243164, -0.005799651145935059, -0.005608081817626953, -0.005416512489318848, -0.005224943161010742, -0.005033373832702637, -0.004841804504394531, -0.004650235176086426, -0.00445866584777832, -0.004267096519470215, -0.004075527191162109, -0.003883957862854004, -0.0036923885345458984, -0.003500819206237793, -0.0033092498779296875, -0.003117680549621582, -0.0029261112213134766, -0.002734541893005371, -0.0025429725646972656, -0.00235140323638916, -0.0021598339080810547, -0.0019682645797729492, -0.0017766952514648438, -0.0015851259231567383, -0.0013935565948486328, -0.0012019872665405273, -0.0010104179382324219, -0.0008188486099243164, -0.0006272792816162109, -0.00043570995330810547, -0.000244140625, -5.257129669189453e-05, 0.00013899803161621094, 0.0003305673599243164, 0.0005221366882324219, 0.0007137060165405273, 0.0009052753448486328, 0.0010968446731567383, 0.0012884140014648438, 0.0014799833297729492, 0.0016715526580810547, 0.0018631219863891602, 0.0020546913146972656, 0.002246260643005371, 0.0024378299713134766, 0.002629399299621582, 0.0028209686279296875, 0.003012537956237793, 0.0032041072845458984, 0.003395676612854004, 0.0035872459411621094, 0.003778815269470215, 0.00397038459777832, 0.004161953926086426, 0.004353523254394531, 0.004545092582702637, 0.004736661911010742, 0.004928231239318848, 0.005119800567626953, 0.005311369895935059, 0.005502939224243164, 0.0056945085525512695, 0.005886077880859375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 31.0, 171.0, 409.0, 312.0, 78.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.001052223495207727, -0.001031066058203578, -0.0010099085047841072, -0.0009887510677799582, -0.0009675935725681484, -0.0009464360773563385, -0.0009252786403521895, -0.0009041211451403797, -0.0008829636499285698, -0.0008618061547167599, -0.000840648717712611, -0.0008194912225008011, -0.0007983337272889912, -0.0007771762320771813, -0.0007560187950730324, -0.0007348612998612225, -0.0007137038628570735, -0.0006925463676452637, -0.0006713889306411147, -0.0006502314354293048, -0.000629073940217495, -0.000607916503213346, -0.0005867590080015361, -0.0005656015127897263, -0.0005444440757855773, -0.0005232865805737674, -0.0005021291435696185, -0.0004809716483578086, -0.0004598141531459987, -0.0004386566870380193, -0.0004174992209300399, -0.00039634172571823, -0.00037518423050642014, -0.0003540267643984407, -0.00033286926918663085, -0.00031171180307865143, -0.00029055430786684155, -0.00026939684175886214, -0.0002482393756508827, -0.00022708189499098808, -0.00020592441433109343, -0.00018476693367119879, -0.00016360945301130414, -0.00014245198690332472, -0.00012129450624343008, -0.00010013702558353543, -7.897955947555602e-05, -5.782207881566137e-05, -3.6664598155766726e-05, -1.5507121133850887e-05, 5.650355888064951e-06, 2.6807829272001982e-05, 4.796530993189663e-05, 6.912279059179127e-05, 9.028025669977069e-05, 0.00011143773735966533, 0.00013259521801955998, 0.00015375269867945462, 0.00017491017933934927, 0.0001960676454473287, 0.00021722512610722333, 0.00023838260676711798, 0.0002595400728750974, 0.0002806975389830768, 0.0003018550341948867]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 13.0, 8.0, 11.0, 14.0, 16.0, 18.0, 24.0, 29.0, 19.0, 20.0, 35.0, 30.0, 48.0, 34.0, 42.0, 37.0, 54.0, 41.0, 46.0, 42.0, 46.0, 34.0, 46.0, 32.0, 41.0, 25.0, 20.0, 26.0, 11.0, 20.0, 20.0, 15.0, 17.0, 11.0, 6.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001252293586730957, -0.00012072548270225525, -0.0001162216067314148, -0.00011171773076057434, -0.00010721385478973389, -0.00010270997881889343, -9.820610284805298e-05, -9.370222687721252e-05, -8.919835090637207e-05, -8.469447493553162e-05, -8.019059896469116e-05, -7.568672299385071e-05, -7.118284702301025e-05, -6.66789710521698e-05, -6.217509508132935e-05, -5.767121911048889e-05, -5.316734313964844e-05, -4.8663467168807983e-05, -4.415959119796753e-05, -3.9655715227127075e-05, -3.515183925628662e-05, -3.064796328544617e-05, -2.6144087314605713e-05, -2.164021134376526e-05, -1.7136335372924805e-05, -1.263245940208435e-05, -8.128583431243896e-06, -3.6247074604034424e-06, 8.791685104370117e-07, 5.383044481277466e-06, 9.88692045211792e-06, 1.4390796422958374e-05, 1.8894672393798828e-05, 2.3398548364639282e-05, 2.7902424335479736e-05, 3.240630030632019e-05, 3.6910176277160645e-05, 4.14140522480011e-05, 4.591792821884155e-05, 5.042180418968201e-05, 5.492568016052246e-05, 5.9429556131362915e-05, 6.393343210220337e-05, 6.843730807304382e-05, 7.294118404388428e-05, 7.744506001472473e-05, 8.194893598556519e-05, 8.645281195640564e-05, 9.09566879272461e-05, 9.546056389808655e-05, 9.9964439868927e-05, 0.00010446831583976746, 0.00010897219181060791, 0.00011347606778144836, 0.00011797994375228882, 0.00012248381972312927, 0.00012698769569396973, 0.00013149157166481018, 0.00013599544763565063, 0.0001404993236064911, 0.00014500319957733154, 0.000149507075548172, 0.00015401095151901245, 0.0001585148274898529, 0.00016301870346069336]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 13.0, 17.0, 11.0, 21.0, 11.0, 18.0, 22.0, 24.0, 23.0, 29.0, 38.0, 31.0, 40.0, 51.0, 42.0, 49.0, 41.0, 33.0, 44.0, 33.0, 46.0, 50.0, 25.0, 29.0, 32.0, 22.0, 22.0, 26.0, 16.0, 17.0, 15.0, 14.0, 10.0, 5.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0234375, -1.95208740234375, -1.8807373046875, -1.80938720703125, -1.738037109375, -1.66668701171875, -1.5953369140625, -1.52398681640625, -1.45263671875, -1.38128662109375, -1.3099365234375, -1.23858642578125, -1.167236328125, -1.09588623046875, -1.0245361328125, -0.95318603515625, -0.8818359375, -0.81048583984375, -0.7391357421875, -0.66778564453125, -0.596435546875, -0.52508544921875, -0.4537353515625, -0.38238525390625, -0.31103515625, -0.23968505859375, -0.1683349609375, -0.09698486328125, -0.025634765625, 0.04571533203125, 0.1170654296875, 0.18841552734375, 0.259765625, 0.33111572265625, 0.4024658203125, 0.47381591796875, 0.545166015625, 0.61651611328125, 0.6878662109375, 0.75921630859375, 0.83056640625, 0.90191650390625, 0.9732666015625, 1.04461669921875, 1.115966796875, 1.18731689453125, 1.2586669921875, 1.33001708984375, 1.4013671875, 1.47271728515625, 1.5440673828125, 1.61541748046875, 1.686767578125, 1.75811767578125, 1.8294677734375, 1.90081787109375, 1.97216796875, 2.04351806640625, 2.1148681640625, 2.18621826171875, 2.257568359375, 2.32891845703125, 2.4002685546875, 2.47161865234375, 2.54296875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 8.0, 12.0, 29.0, 28.0, 46.0, 83.0, 109.0, 165.0, 272.0, 375.0, 746.0, 1437.0, 3049.0, 6783.0, 15015.0, 32352.0, 68894.0, 148818.0, 275635.0, 254427.0, 128304.0, 59757.0, 27843.0, 12853.0, 5893.0, 2642.0, 1285.0, 675.0, 381.0, 212.0, 150.0, 82.0, 59.0, 49.0, 25.0, 19.0, 18.0, 8.0, 9.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.087921142578125, -2.01568603515625, -1.943450927734375, -1.8712158203125, -1.798980712890625, -1.72674560546875, -1.654510498046875, -1.582275390625, -1.510040283203125, -1.43780517578125, -1.365570068359375, -1.2933349609375, -1.221099853515625, -1.14886474609375, -1.076629638671875, -1.00439453125, -0.932159423828125, -0.85992431640625, -0.787689208984375, -0.7154541015625, -0.643218994140625, -0.57098388671875, -0.498748779296875, -0.426513671875, -0.354278564453125, -0.28204345703125, -0.209808349609375, -0.1375732421875, -0.065338134765625, 0.00689697265625, 0.079132080078125, 0.1513671875, 0.223602294921875, 0.29583740234375, 0.368072509765625, 0.4403076171875, 0.512542724609375, 0.58477783203125, 0.657012939453125, 0.729248046875, 0.801483154296875, 0.87371826171875, 0.945953369140625, 1.0181884765625, 1.090423583984375, 1.16265869140625, 1.234893798828125, 1.30712890625, 1.379364013671875, 1.45159912109375, 1.523834228515625, 1.5960693359375, 1.668304443359375, 1.74053955078125, 1.812774658203125, 1.885009765625, 1.957244873046875, 2.02947998046875, 2.101715087890625, 2.1739501953125, 2.246185302734375, 2.31842041015625, 2.390655517578125, 2.462890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 14.0, 11.0, 11.0, 12.0, 16.0, 30.0, 31.0, 38.0, 45.0, 57.0, 68.0, 85.0, 141.0, 411.0, 1477.0, 168.0, 81.0, 57.0, 64.0, 43.0, 44.0, 33.0, 27.0, 24.0, 10.0, 9.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.9559326171875, -14.552490234375, -14.1490478515625, -13.74560546875, -13.3421630859375, -12.938720703125, -12.5352783203125, -12.1318359375, -11.7283935546875, -11.324951171875, -10.9215087890625, -10.51806640625, -10.1146240234375, -9.711181640625, -9.3077392578125, -8.904296875, -8.5008544921875, -8.097412109375, -7.6939697265625, -7.29052734375, -6.8870849609375, -6.483642578125, -6.0802001953125, -5.6767578125, -5.2733154296875, -4.869873046875, -4.4664306640625, -4.06298828125, -3.6595458984375, -3.256103515625, -2.8526611328125, -2.44921875, -2.0457763671875, -1.642333984375, -1.2388916015625, -0.83544921875, -0.4320068359375, -0.028564453125, 0.3748779296875, 0.7783203125, 1.1817626953125, 1.585205078125, 1.9886474609375, 2.39208984375, 2.7955322265625, 3.198974609375, 3.6024169921875, 4.005859375, 4.4093017578125, 4.812744140625, 5.2161865234375, 5.61962890625, 6.0230712890625, 6.426513671875, 6.8299560546875, 7.2333984375, 7.6368408203125, 8.040283203125, 8.4437255859375, 8.84716796875, 9.2506103515625, 9.654052734375, 10.0574951171875, 10.4609375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 11.0, 8.0, 12.0, 18.0, 20.0, 29.0, 26.0, 61.0, 77.0, 118.0, 189.0, 336.0, 622.0, 3461.0, 2998112.0, 140093.0, 1213.0, 485.0, 263.0, 147.0, 97.0, 68.0, 52.0, 45.0, 30.0, 27.0, 15.0, 18.0, 17.0, 5.0, 5.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.390625, -26.328857421875, -25.26708984375, -24.205322265625, -23.1435546875, -22.081787109375, -21.02001953125, -19.958251953125, -18.896484375, -17.834716796875, -16.77294921875, -15.711181640625, -14.6494140625, -13.587646484375, -12.52587890625, -11.464111328125, -10.40234375, -9.340576171875, -8.27880859375, -7.217041015625, -6.1552734375, -5.093505859375, -4.03173828125, -2.969970703125, -1.908203125, -0.846435546875, 0.21533203125, 1.277099609375, 2.3388671875, 3.400634765625, 4.46240234375, 5.524169921875, 6.5859375, 7.647705078125, 8.70947265625, 9.771240234375, 10.8330078125, 11.894775390625, 12.95654296875, 14.018310546875, 15.080078125, 16.141845703125, 17.20361328125, 18.265380859375, 19.3271484375, 20.388916015625, 21.45068359375, 22.512451171875, 23.57421875, 24.635986328125, 25.69775390625, 26.759521484375, 27.8212890625, 28.883056640625, 29.94482421875, 31.006591796875, 32.068359375, 33.130126953125, 34.19189453125, 35.253662109375, 36.3154296875, 37.377197265625, 38.43896484375, 39.500732421875, 40.5625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 10.0, 38.0, 109.0, 222.0, 303.0, 203.0, 93.0, 28.0, 10.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.79438591003418, -28.78071403503418, -27.76704216003418, -26.75337028503418, -25.73969841003418, -24.72602653503418, -23.712352752685547, -22.698680877685547, -21.685009002685547, -20.671337127685547, -19.657665252685547, -18.643993377685547, -17.630321502685547, -16.616649627685547, -15.60297679901123, -14.58930492401123, -13.575634002685547, -12.561962127685547, -11.548290252685547, -10.534618377685547, -9.520946502685547, -8.507274627685547, -7.4936017990112305, -6.4799299240112305, -5.4662580490112305, -4.4525861740112305, -3.4389140605926514, -2.4252419471740723, -1.4115700721740723, -0.39789819717407227, 0.6157741546630859, 1.629446029663086, 2.643115997314453, 3.656787872314453, 4.670459747314453, 5.684132099151611, 6.697803974151611, 7.711475849151611, 8.72514820098877, 9.73882007598877, 10.75249195098877, 11.76616382598877, 12.77983570098877, 13.793508529663086, 14.807180404663086, 15.820852279663086, 16.834524154663086, 17.848196029663086, 18.861867904663086, 19.875539779663086, 20.889211654663086, 21.902883529663086, 22.916555404663086, 23.930227279663086, 24.94390106201172, 25.95757293701172, 26.97124481201172, 27.98491668701172, 28.99858856201172, 30.01226043701172, 31.02593231201172, 32.03960418701172, 33.05327606201172, 34.06694793701172, 35.08061981201172]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 5.0, 9.0, 11.0, 17.0, 18.0, 19.0, 20.0, 15.0, 26.0, 24.0, 23.0, 33.0, 35.0, 32.0, 37.0, 41.0, 38.0, 36.0, 36.0, 49.0, 51.0, 42.0, 35.0, 35.0, 32.0, 29.0, 23.0, 28.0, 24.0, 26.0, 26.0, 20.0, 19.0, 18.0, 14.0, 7.0, 5.0, 9.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.522613525390625, -18.866973876953125, -18.211334228515625, -17.555696487426758, -16.900056838989258, -16.244417190551758, -15.588777542114258, -14.933137893676758, -14.277499198913574, -13.621859550476074, -12.96622085571289, -12.31058120727539, -11.65494155883789, -10.999302864074707, -10.343663215637207, -9.688024520874023, -9.032384872436523, -8.376745223999023, -7.72110652923584, -7.06546688079834, -6.409827709197998, -5.754188537597656, -5.098548889160156, -4.4429097175598145, -3.7872705459594727, -3.131631374359131, -2.47599196434021, -1.8203526735305786, -1.1647133827209473, -0.5090742111206055, 0.14656519889831543, 0.8022046089172363, 1.4578437805175781, 2.11348295211792, 2.769122362136841, 3.4247617721557617, 4.0804009437561035, 4.736040115356445, 5.391679763793945, 6.047318935394287, 6.702958106994629, 7.358597278594971, 8.014236450195312, 8.669876098632812, 9.325515747070312, 9.981154441833496, 10.636794090270996, 11.29243278503418, 11.94807243347168, 12.60371208190918, 13.259350776672363, 13.914990425109863, 14.570629119873047, 15.226268768310547, 15.881908416748047, 16.537548065185547, 17.193187713623047, 17.848827362060547, 18.504467010498047, 19.160104751586914, 19.815744400024414, 20.471384048461914, 21.127023696899414, 21.782663345336914, 22.43830108642578]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 6.0, 4.0, 7.0, 5.0, 4.0, 12.0, 11.0, 6.0, 18.0, 16.0, 22.0, 12.0, 25.0, 20.0, 19.0, 27.0, 33.0, 33.0, 32.0, 43.0, 42.0, 26.0, 40.0, 49.0, 41.0, 49.0, 44.0, 32.0, 30.0, 22.0, 38.0, 39.0, 28.0, 26.0, 18.0, 13.0, 14.0, 16.0, 13.0, 9.0, 10.0, 12.0, 6.0, 10.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.412109375, -2.335784912109375, -2.25946044921875, -2.183135986328125, -2.1068115234375, -2.030487060546875, -1.95416259765625, -1.877838134765625, -1.801513671875, -1.725189208984375, -1.64886474609375, -1.572540283203125, -1.4962158203125, -1.419891357421875, -1.34356689453125, -1.267242431640625, -1.19091796875, -1.114593505859375, -1.03826904296875, -0.961944580078125, -0.8856201171875, -0.809295654296875, -0.73297119140625, -0.656646728515625, -0.580322265625, -0.503997802734375, -0.42767333984375, -0.351348876953125, -0.2750244140625, -0.198699951171875, -0.12237548828125, -0.046051025390625, 0.0302734375, 0.106597900390625, 0.18292236328125, 0.259246826171875, 0.3355712890625, 0.411895751953125, 0.48822021484375, 0.564544677734375, 0.640869140625, 0.717193603515625, 0.79351806640625, 0.869842529296875, 0.9461669921875, 1.022491455078125, 1.09881591796875, 1.175140380859375, 1.25146484375, 1.327789306640625, 1.40411376953125, 1.480438232421875, 1.5567626953125, 1.633087158203125, 1.70941162109375, 1.785736083984375, 1.862060546875, 1.938385009765625, 2.01470947265625, 2.091033935546875, 2.1673583984375, 2.243682861328125, 2.32000732421875, 2.396331787109375, 2.47265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 3.0, 5.0, 8.0, 12.0, 15.0, 9.0, 14.0, 20.0, 22.0, 20.0, 28.0, 25.0, 34.0, 60.0, 73.0, 144.0, 282.0, 643.0, 2787.0, 46087.0, 1621350.0, 2416521.0, 99917.0, 4383.0, 869.0, 357.0, 170.0, 98.0, 69.0, 50.0, 34.0, 21.0, 26.0, 11.0, 14.0, 9.0, 17.0, 7.0, 11.0, 11.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.7109375, -8.4395751953125, -8.168212890625, -7.8968505859375, -7.62548828125, -7.3541259765625, -7.082763671875, -6.8114013671875, -6.5400390625, -6.2686767578125, -5.997314453125, -5.7259521484375, -5.45458984375, -5.1832275390625, -4.911865234375, -4.6405029296875, -4.369140625, -4.0977783203125, -3.826416015625, -3.5550537109375, -3.28369140625, -3.0123291015625, -2.740966796875, -2.4696044921875, -2.1982421875, -1.9268798828125, -1.655517578125, -1.3841552734375, -1.11279296875, -0.8414306640625, -0.570068359375, -0.2987060546875, -0.02734375, 0.2440185546875, 0.515380859375, 0.7867431640625, 1.05810546875, 1.3294677734375, 1.600830078125, 1.8721923828125, 2.1435546875, 2.4149169921875, 2.686279296875, 2.9576416015625, 3.22900390625, 3.5003662109375, 3.771728515625, 4.0430908203125, 4.314453125, 4.5858154296875, 4.857177734375, 5.1285400390625, 5.39990234375, 5.6712646484375, 5.942626953125, 6.2139892578125, 6.4853515625, 6.7567138671875, 7.028076171875, 7.2994384765625, 7.57080078125, 7.8421630859375, 8.113525390625, 8.3848876953125, 8.65625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 7.0, 11.0, 15.0, 22.0, 30.0, 52.0, 67.0, 92.0, 126.0, 164.0, 234.0, 306.0, 385.0, 401.0, 478.0, 389.0, 350.0, 265.0, 189.0, 125.0, 90.0, 80.0, 55.0, 40.0, 24.0, 21.0, 10.0, 14.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.17578125, -6.9925537109375, -6.809326171875, -6.6260986328125, -6.44287109375, -6.2596435546875, -6.076416015625, -5.8931884765625, -5.7099609375, -5.5267333984375, -5.343505859375, -5.1602783203125, -4.97705078125, -4.7938232421875, -4.610595703125, -4.4273681640625, -4.244140625, -4.0609130859375, -3.877685546875, -3.6944580078125, -3.51123046875, -3.3280029296875, -3.144775390625, -2.9615478515625, -2.7783203125, -2.5950927734375, -2.411865234375, -2.2286376953125, -2.04541015625, -1.8621826171875, -1.678955078125, -1.4957275390625, -1.3125, -1.1292724609375, -0.946044921875, -0.7628173828125, -0.57958984375, -0.3963623046875, -0.213134765625, -0.0299072265625, 0.1533203125, 0.3365478515625, 0.519775390625, 0.7030029296875, 0.88623046875, 1.0694580078125, 1.252685546875, 1.4359130859375, 1.619140625, 1.8023681640625, 1.985595703125, 2.1688232421875, 2.35205078125, 2.5352783203125, 2.718505859375, 2.9017333984375, 3.0849609375, 3.2681884765625, 3.451416015625, 3.6346435546875, 3.81787109375, 4.0010986328125, 4.184326171875, 4.3675537109375, 4.55078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 8.0, 3.0, 10.0, 14.0, 10.0, 22.0, 28.0, 47.0, 41.0, 68.0, 90.0, 106.0, 147.0, 203.0, 303.0, 574.0, 2231.0, 40027.0, 2164632.0, 1947216.0, 34738.0, 2103.0, 578.0, 307.0, 219.0, 153.0, 91.0, 83.0, 57.0, 59.0, 37.0, 21.0, 11.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.83203125, -10.3984375, -9.96484375, -9.53125, -9.09765625, -8.6640625, -8.23046875, -7.796875, -7.36328125, -6.9296875, -6.49609375, -6.0625, -5.62890625, -5.1953125, -4.76171875, -4.328125, -3.89453125, -3.4609375, -3.02734375, -2.59375, -2.16015625, -1.7265625, -1.29296875, -0.859375, -0.42578125, 0.0078125, 0.44140625, 0.875, 1.30859375, 1.7421875, 2.17578125, 2.609375, 3.04296875, 3.4765625, 3.91015625, 4.34375, 4.77734375, 5.2109375, 5.64453125, 6.078125, 6.51171875, 6.9453125, 7.37890625, 7.8125, 8.24609375, 8.6796875, 9.11328125, 9.546875, 9.98046875, 10.4140625, 10.84765625, 11.28125, 11.71484375, 12.1484375, 12.58203125, 13.015625, 13.44921875, 13.8828125, 14.31640625, 14.75, 15.18359375, 15.6171875, 16.05078125, 16.484375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 19.0, 31.0, 63.0, 87.0, 123.0, 168.0, 169.0, 155.0, 102.0, 43.0, 27.0, 17.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.459632873535156, -26.364343643188477, -25.269054412841797, -24.173765182495117, -23.078475952148438, -21.983186721801758, -20.887897491455078, -19.7926082611084, -18.69731903076172, -17.60202980041504, -16.50674057006836, -15.41145133972168, -14.316162109375, -13.22087287902832, -12.12558364868164, -11.030294418334961, -9.935005187988281, -8.839715957641602, -7.744426727294922, -6.649137496948242, -5.5538482666015625, -4.458559036254883, -3.363269805908203, -2.2679805755615234, -1.1726913452148438, -0.07740211486816406, 1.0178871154785156, 2.1131763458251953, 3.208465576171875, 4.303754806518555, 5.399044036865234, 6.494333267211914, 7.589618682861328, 8.684907913208008, 9.780197143554688, 10.875486373901367, 11.970775604248047, 13.066064834594727, 14.161354064941406, 15.256643295288086, 16.351932525634766, 17.447221755981445, 18.542510986328125, 19.637800216674805, 20.733089447021484, 21.828378677368164, 22.923667907714844, 24.018957138061523, 25.114246368408203, 26.209535598754883, 27.304824829101562, 28.400114059448242, 29.495403289794922, 30.5906925201416, 31.68598175048828, 32.781272888183594, 33.87656021118164, 34.97184753417969, 36.067138671875, 37.16242980957031, 38.25771713256836, 39.353004455566406, 40.44829559326172, 41.54358673095703, 42.63887405395508]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 12.0, 9.0, 14.0, 18.0, 25.0, 26.0, 35.0, 36.0, 26.0, 34.0, 36.0, 39.0, 33.0, 36.0, 44.0, 43.0, 46.0, 32.0, 45.0, 40.0, 41.0, 42.0, 36.0, 33.0, 35.0, 32.0, 26.0, 16.0, 21.0, 13.0, 12.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.082216262817383, -17.480741500854492, -16.879268646240234, -16.277793884277344, -15.676319122314453, -15.074845314025879, -14.473371505737305, -13.871896743774414, -13.27042293548584, -12.668949127197266, -12.067474365234375, -11.4660005569458, -10.864526748657227, -10.263051986694336, -9.661578178405762, -9.060104370117188, -8.458629608154297, -7.8571553230285645, -7.255681037902832, -6.654207229614258, -6.052732944488525, -5.451258659362793, -4.849784851074219, -4.248310565948486, -3.646836280822754, -3.0453619956970215, -2.443887948989868, -1.8424137830734253, -1.2409396171569824, -0.63946533203125, -0.03799128532409668, 0.5634827613830566, 1.1649551391601562, 1.7664293050765991, 2.367903470993042, 2.9693775177001953, 3.5708518028259277, 4.17232608795166, 4.773799896240234, 5.375274181365967, 5.976748466491699, 6.578222751617432, 7.179697036743164, 7.781170845031738, 8.382644653320312, 8.984119415283203, 9.585593223571777, 10.187067031860352, 10.788541793823242, 11.390015602111816, 11.991490364074707, 12.592964172363281, 13.194438934326172, 13.795912742614746, 14.39738655090332, 14.998861312866211, 15.600335121154785, 16.20180892944336, 16.80328369140625, 17.40475845336914, 18.0062313079834, 18.60770606994629, 19.20918083190918, 19.810653686523438, 20.412128448486328]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 9.0, 5.0, 15.0, 13.0, 15.0, 14.0, 20.0, 16.0, 18.0, 20.0, 21.0, 29.0, 23.0, 30.0, 30.0, 36.0, 41.0, 44.0, 52.0, 41.0, 44.0, 40.0, 39.0, 36.0, 35.0, 33.0, 32.0, 38.0, 23.0, 20.0, 24.0, 25.0, 12.0, 10.0, 13.0, 13.0, 7.0, 12.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.42578125, -2.35235595703125, -2.2789306640625, -2.20550537109375, -2.132080078125, -2.05865478515625, -1.9852294921875, -1.91180419921875, -1.83837890625, -1.76495361328125, -1.6915283203125, -1.61810302734375, -1.544677734375, -1.47125244140625, -1.3978271484375, -1.32440185546875, -1.2509765625, -1.17755126953125, -1.1041259765625, -1.03070068359375, -0.957275390625, -0.88385009765625, -0.8104248046875, -0.73699951171875, -0.66357421875, -0.59014892578125, -0.5167236328125, -0.44329833984375, -0.369873046875, -0.29644775390625, -0.2230224609375, -0.14959716796875, -0.076171875, -0.00274658203125, 0.0706787109375, 0.14410400390625, 0.217529296875, 0.29095458984375, 0.3643798828125, 0.43780517578125, 0.51123046875, 0.58465576171875, 0.6580810546875, 0.73150634765625, 0.804931640625, 0.87835693359375, 0.9517822265625, 1.02520751953125, 1.0986328125, 1.17205810546875, 1.2454833984375, 1.31890869140625, 1.392333984375, 1.46575927734375, 1.5391845703125, 1.61260986328125, 1.68603515625, 1.75946044921875, 1.8328857421875, 1.90631103515625, 1.979736328125, 2.05316162109375, 2.1265869140625, 2.20001220703125, 2.2734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 10.0, 10.0, 17.0, 24.0, 37.0, 45.0, 83.0, 105.0, 149.0, 232.0, 384.0, 533.0, 819.0, 1184.0, 1723.0, 2551.0, 3651.0, 5387.0, 7826.0, 11184.0, 16615.0, 25372.0, 40039.0, 66139.0, 122234.0, 264629.0, 215312.0, 100836.0, 56405.0, 34962.0, 22674.0, 15127.0, 10316.0, 6886.0, 4774.0, 3258.0, 2317.0, 1443.0, 1045.0, 753.0, 491.0, 325.0, 229.0, 131.0, 99.0, 64.0, 47.0, 41.0, 16.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4189453125, -0.4053688049316406, -0.39179229736328125, -0.3782157897949219, -0.3646392822265625, -0.3510627746582031, -0.33748626708984375, -0.3239097595214844, -0.310333251953125, -0.2967567443847656, -0.28318023681640625, -0.2696037292480469, -0.2560272216796875, -0.24245071411132812, -0.22887420654296875, -0.21529769897460938, -0.20172119140625, -0.18814468383789062, -0.17456817626953125, -0.16099166870117188, -0.1474151611328125, -0.13383865356445312, -0.12026214599609375, -0.10668563842773438, -0.093109130859375, -0.07953262329101562, -0.06595611572265625, -0.052379608154296875, -0.0388031005859375, -0.025226593017578125, -0.01165008544921875, 0.001926422119140625, 0.0155029296875, 0.029079437255859375, 0.04265594482421875, 0.056232452392578125, 0.0698089599609375, 0.08338546752929688, 0.09696197509765625, 0.11053848266601562, 0.124114990234375, 0.13769149780273438, 0.15126800537109375, 0.16484451293945312, 0.1784210205078125, 0.19199752807617188, 0.20557403564453125, 0.21915054321289062, 0.23272705078125, 0.24630355834960938, 0.25988006591796875, 0.2734565734863281, 0.2870330810546875, 0.3006095886230469, 0.31418609619140625, 0.3277626037597656, 0.341339111328125, 0.3549156188964844, 0.36849212646484375, 0.3820686340332031, 0.3956451416015625, 0.4092216491699219, 0.42279815673828125, 0.4363746643066406, 0.449951171875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 7.0, 14.0, 13.0, 11.0, 9.0, 24.0, 25.0, 23.0, 20.0, 23.0, 22.0, 30.0, 24.0, 38.0, 38.0, 50.0, 37.0, 43.0, 1063.0, 42.0, 40.0, 47.0, 39.0, 36.0, 28.0, 31.0, 36.0, 18.0, 30.0, 27.0, 18.0, 21.0, 11.0, 12.0, 15.0, 7.0, 10.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.53125, -1.4826507568359375, -1.434051513671875, -1.3854522705078125, -1.33685302734375, -1.2882537841796875, -1.239654541015625, -1.1910552978515625, -1.1424560546875, -1.0938568115234375, -1.045257568359375, -0.9966583251953125, -0.94805908203125, -0.8994598388671875, -0.850860595703125, -0.8022613525390625, -0.753662109375, -0.7050628662109375, -0.656463623046875, -0.6078643798828125, -0.55926513671875, -0.5106658935546875, -0.462066650390625, -0.4134674072265625, -0.3648681640625, -0.3162689208984375, -0.267669677734375, -0.2190704345703125, -0.17047119140625, -0.1218719482421875, -0.073272705078125, -0.0246734619140625, 0.02392578125, 0.0725250244140625, 0.121124267578125, 0.1697235107421875, 0.21832275390625, 0.2669219970703125, 0.315521240234375, 0.3641204833984375, 0.4127197265625, 0.4613189697265625, 0.509918212890625, 0.5585174560546875, 0.60711669921875, 0.6557159423828125, 0.704315185546875, 0.7529144287109375, 0.801513671875, 0.8501129150390625, 0.898712158203125, 0.9473114013671875, 0.99591064453125, 1.0445098876953125, 1.093109130859375, 1.1417083740234375, 1.1903076171875, 1.2389068603515625, 1.287506103515625, 1.3361053466796875, 1.38470458984375, 1.4333038330078125, 1.481903076171875, 1.5305023193359375, 1.5791015625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 18.0, 19.0, 28.0, 53.0, 61.0, 78.0, 130.0, 195.0, 261.0, 422.0, 662.0, 947.0, 1447.0, 2107.0, 3272.0, 4734.0, 7312.0, 11066.0, 17337.0, 27105.0, 44512.0, 75686.0, 145470.0, 1343819.0, 181949.0, 89946.0, 50980.0, 30767.0, 19588.0, 12439.0, 8352.0, 5361.0, 3657.0, 2461.0, 1603.0, 1100.0, 734.0, 500.0, 332.0, 206.0, 142.0, 85.0, 66.0, 32.0, 31.0, 25.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.43017578125, -0.4165802001953125, -0.402984619140625, -0.3893890380859375, -0.37579345703125, -0.3621978759765625, -0.348602294921875, -0.3350067138671875, -0.3214111328125, -0.3078155517578125, -0.294219970703125, -0.2806243896484375, -0.26702880859375, -0.2534332275390625, -0.239837646484375, -0.2262420654296875, -0.212646484375, -0.1990509033203125, -0.185455322265625, -0.1718597412109375, -0.15826416015625, -0.1446685791015625, -0.131072998046875, -0.1174774169921875, -0.1038818359375, -0.0902862548828125, -0.076690673828125, -0.0630950927734375, -0.04949951171875, -0.0359039306640625, -0.022308349609375, -0.0087127685546875, 0.0048828125, 0.0184783935546875, 0.032073974609375, 0.0456695556640625, 0.05926513671875, 0.0728607177734375, 0.086456298828125, 0.1000518798828125, 0.1136474609375, 0.1272430419921875, 0.140838623046875, 0.1544342041015625, 0.16802978515625, 0.1816253662109375, 0.195220947265625, 0.2088165283203125, 0.222412109375, 0.2360076904296875, 0.249603271484375, 0.2631988525390625, 0.27679443359375, 0.2903900146484375, 0.303985595703125, 0.3175811767578125, 0.3311767578125, 0.3447723388671875, 0.358367919921875, 0.3719635009765625, 0.38555908203125, 0.3991546630859375, 0.412750244140625, 0.4263458251953125, 0.43994140625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 6.0, 12.0, 9.0, 17.0, 15.0, 12.0, 16.0, 28.0, 25.0, 34.0, 29.0, 51.0, 49.0, 41.0, 46.0, 50.0, 59.0, 50.0, 67.0, 54.0, 54.0, 42.0, 33.0, 37.0, 26.0, 25.0, 13.0, 16.0, 13.0, 14.0, 9.0, 4.0, 8.0, 5.0, 5.0, 1.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0002791881561279297, -0.0002708137035369873, -0.0002624392509460449, -0.00025406479835510254, -0.00024569034576416016, -0.00023731589317321777, -0.0002289414405822754, -0.000220566987991333, -0.00021219253540039062, -0.00020381808280944824, -0.00019544363021850586, -0.00018706917762756348, -0.0001786947250366211, -0.0001703202724456787, -0.00016194581985473633, -0.00015357136726379395, -0.00014519691467285156, -0.00013682246208190918, -0.0001284480094909668, -0.00012007355690002441, -0.00011169910430908203, -0.00010332465171813965, -9.495019912719727e-05, -8.657574653625488e-05, -7.82012939453125e-05, -6.982684135437012e-05, -6.145238876342773e-05, -5.307793617248535e-05, -4.470348358154297e-05, -3.6329030990600586e-05, -2.7954578399658203e-05, -1.958012580871582e-05, -1.1205673217773438e-05, -2.8312206268310547e-06, 5.543231964111328e-06, 1.3917684555053711e-05, 2.2292137145996094e-05, 3.0666589736938477e-05, 3.904104232788086e-05, 4.741549491882324e-05, 5.5789947509765625e-05, 6.416440010070801e-05, 7.253885269165039e-05, 8.091330528259277e-05, 8.928775787353516e-05, 9.766221046447754e-05, 0.00010603666305541992, 0.0001144111156463623, 0.0001227855682373047, 0.00013116002082824707, 0.00013953447341918945, 0.00014790892601013184, 0.00015628337860107422, 0.0001646578311920166, 0.00017303228378295898, 0.00018140673637390137, 0.00018978118896484375, 0.00019815564155578613, 0.00020653009414672852, 0.0002149045467376709, 0.00022327899932861328, 0.00023165345191955566, 0.00024002790451049805, 0.00024840235710144043, 0.0002567768096923828]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 5.0, 7.0, 5.0, 11.0, 18.0, 13.0, 26.0, 30.0, 42.0, 41.0, 62.0, 73.0, 145.0, 236.0, 400.0, 806.0, 5103.0, 996327.0, 42811.0, 1104.0, 461.0, 233.0, 162.0, 103.0, 79.0, 54.0, 41.0, 26.0, 16.0, 26.0, 12.0, 9.0, 9.0, 10.0, 13.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00519561767578125, -0.0050261616706848145, -0.004856705665588379, -0.004687249660491943, -0.004517793655395508, -0.004348337650299072, -0.004178881645202637, -0.004009425640106201, -0.0038399696350097656, -0.00367051362991333, -0.0035010576248168945, -0.003331601619720459, -0.0031621456146240234, -0.002992689609527588, -0.0028232336044311523, -0.002653777599334717, -0.0024843215942382812, -0.0023148655891418457, -0.00214540958404541, -0.0019759535789489746, -0.001806497573852539, -0.0016370415687561035, -0.001467585563659668, -0.0012981295585632324, -0.0011286735534667969, -0.0009592175483703613, -0.0007897615432739258, -0.0006203055381774902, -0.0004508495330810547, -0.00028139352798461914, -0.0001119375228881836, 5.751848220825195e-05, 0.0002269744873046875, 0.00039643049240112305, 0.0005658864974975586, 0.0007353425025939941, 0.0009047985076904297, 0.0010742545127868652, 0.0012437105178833008, 0.0014131665229797363, 0.0015826225280761719, 0.0017520785331726074, 0.001921534538269043, 0.0020909905433654785, 0.002260446548461914, 0.0024299025535583496, 0.002599358558654785, 0.0027688145637512207, 0.0029382705688476562, 0.003107726573944092, 0.0032771825790405273, 0.003446638584136963, 0.0036160945892333984, 0.003785550594329834, 0.0039550065994262695, 0.004124462604522705, 0.004293918609619141, 0.004463374614715576, 0.004632830619812012, 0.004802286624908447, 0.004971742630004883, 0.005141198635101318, 0.005310654640197754, 0.0054801106452941895, 0.005649566650390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 11.0, 62.0, 204.0, 405.0, 253.0, 63.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009686995763331652, -0.0009487346396781504, -0.0009287697612307966, -0.0009088048245757818, -0.0008888398879207671, -0.0008688750094734132, -0.0008489100728183985, -0.0008289451943710446, -0.0008089802577160299, -0.0007890153210610151, -0.0007690504426136613, -0.0007490855059586465, -0.0007291205693036318, -0.0007091556908562779, -0.0006891907542012632, -0.0006692258175462484, -0.0006492609390988946, -0.0006292960024438798, -0.000609331123996526, -0.0005893661873415112, -0.0005694012506864965, -0.0005494363722391427, -0.0005294714355841279, -0.0005095065571367741, -0.0004895415622740984, -0.0004695766547229141, -0.00044961171806789935, -0.00042964681051671505, -0.00040968190296553075, -0.00038971699541434646, -0.0003697520587593317, -0.0003497871512081474, -0.0003298222436569631, -0.0003098573361057788, -0.00028989239945076406, -0.00026992749189957976, -0.00024996258434839547, -0.00022999766224529594, -0.00021003274014219642, -0.00019006783259101212, -0.0001701029104879126, -0.00015013798838481307, -0.00013017308083362877, -0.00011020815873052925, -9.024324390338734e-05, -7.027832907624543e-05, -5.03134069731459e-05, -3.0348499421961606e-05, -1.038357731886208e-05, 9.581339327269234e-06, 2.9546255973400548e-05, 4.9511174438521266e-05, 6.947608926566318e-05, 8.944100409280509e-05, 0.00010940592619590461, 0.0001293708337470889, 0.00014933575585018843, 0.00016930067795328796, 0.00018926558550447226, 0.00020923050760757178, 0.0002291954297106713, 0.0002491603372618556, 0.00026912527391687036, 0.0002890901523642242, 0.00030905508901923895]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 8.0, 9.0, 12.0, 10.0, 7.0, 13.0, 12.0, 24.0, 22.0, 21.0, 29.0, 40.0, 27.0, 37.0, 35.0, 49.0, 37.0, 38.0, 57.0, 39.0, 47.0, 43.0, 51.0, 38.0, 35.0, 30.0, 23.0, 27.0, 31.0, 25.0, 22.0, 17.0, 17.0, 12.0, 15.0, 6.0, 10.0, 5.0, 8.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015354156494140625, -0.00014870613813400269, -0.00014387071132659912, -0.00013903528451919556, -0.000134199857711792, -0.00012936443090438843, -0.00012452900409698486, -0.0001196935772895813, -0.00011485815048217773, -0.00011002272367477417, -0.0001051872968673706, -0.00010035187005996704, -9.551644325256348e-05, -9.068101644515991e-05, -8.584558963775635e-05, -8.101016283035278e-05, -7.617473602294922e-05, -7.133930921554565e-05, -6.650388240814209e-05, -6.166845560073853e-05, -5.683302879333496e-05, -5.1997601985931396e-05, -4.716217517852783e-05, -4.232674837112427e-05, -3.74913215637207e-05, -3.265589475631714e-05, -2.7820467948913574e-05, -2.298504114151001e-05, -1.8149614334106445e-05, -1.3314187526702881e-05, -8.478760719299316e-06, -3.643333911895752e-06, 1.1920928955078125e-06, 6.027519702911377e-06, 1.0862946510314941e-05, 1.5698373317718506e-05, 2.053380012512207e-05, 2.5369226932525635e-05, 3.02046537399292e-05, 3.5040080547332764e-05, 3.987550735473633e-05, 4.471093416213989e-05, 4.954636096954346e-05, 5.438178777694702e-05, 5.9217214584350586e-05, 6.405264139175415e-05, 6.888806819915771e-05, 7.372349500656128e-05, 7.855892181396484e-05, 8.339434862136841e-05, 8.822977542877197e-05, 9.306520223617554e-05, 9.79006290435791e-05, 0.00010273605585098267, 0.00010757148265838623, 0.0001124069094657898, 0.00011724233627319336, 0.00012207776308059692, 0.0001269131898880005, 0.00013174861669540405, 0.00013658404350280762, 0.00014141947031021118, 0.00014625489711761475, 0.0001510903239250183, 0.00015592575073242188]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 9.0, 5.0, 15.0, 13.0, 15.0, 14.0, 20.0, 16.0, 18.0, 20.0, 21.0, 29.0, 23.0, 30.0, 30.0, 36.0, 41.0, 44.0, 52.0, 41.0, 44.0, 40.0, 39.0, 36.0, 35.0, 33.0, 32.0, 38.0, 23.0, 20.0, 24.0, 25.0, 12.0, 10.0, 13.0, 13.0, 7.0, 12.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.42578125, -2.35235595703125, -2.2789306640625, -2.20550537109375, -2.132080078125, -2.05865478515625, -1.9852294921875, -1.91180419921875, -1.83837890625, -1.76495361328125, -1.6915283203125, -1.61810302734375, -1.544677734375, -1.47125244140625, -1.3978271484375, -1.32440185546875, -1.2509765625, -1.17755126953125, -1.1041259765625, -1.03070068359375, -0.957275390625, -0.88385009765625, -0.8104248046875, -0.73699951171875, -0.66357421875, -0.59014892578125, -0.5167236328125, -0.44329833984375, -0.369873046875, -0.29644775390625, -0.2230224609375, -0.14959716796875, -0.076171875, -0.00274658203125, 0.0706787109375, 0.14410400390625, 0.217529296875, 0.29095458984375, 0.3643798828125, 0.43780517578125, 0.51123046875, 0.58465576171875, 0.6580810546875, 0.73150634765625, 0.804931640625, 0.87835693359375, 0.9517822265625, 1.02520751953125, 1.0986328125, 1.17205810546875, 1.2454833984375, 1.31890869140625, 1.392333984375, 1.46575927734375, 1.5391845703125, 1.61260986328125, 1.68603515625, 1.75946044921875, 1.8328857421875, 1.90631103515625, 1.979736328125, 2.05316162109375, 2.1265869140625, 2.20001220703125, 2.2734375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 11.0, 19.0, 30.0, 35.0, 49.0, 71.0, 114.0, 140.0, 237.0, 321.0, 538.0, 1039.0, 2322.0, 6001.0, 16627.0, 44756.0, 114712.0, 287360.0, 343159.0, 140792.0, 55805.0, 21025.0, 7433.0, 2930.0, 1191.0, 658.0, 403.0, 247.0, 155.0, 112.0, 71.0, 57.0, 36.0, 34.0, 13.0, 12.0, 12.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.326171875, -3.228668212890625, -3.13116455078125, -3.033660888671875, -2.9361572265625, -2.838653564453125, -2.74114990234375, -2.643646240234375, -2.546142578125, -2.448638916015625, -2.35113525390625, -2.253631591796875, -2.1561279296875, -2.058624267578125, -1.96112060546875, -1.863616943359375, -1.76611328125, -1.668609619140625, -1.57110595703125, -1.473602294921875, -1.3760986328125, -1.278594970703125, -1.18109130859375, -1.083587646484375, -0.986083984375, -0.888580322265625, -0.79107666015625, -0.693572998046875, -0.5960693359375, -0.498565673828125, -0.40106201171875, -0.303558349609375, -0.2060546875, -0.108551025390625, -0.01104736328125, 0.086456298828125, 0.1839599609375, 0.281463623046875, 0.37896728515625, 0.476470947265625, 0.573974609375, 0.671478271484375, 0.76898193359375, 0.866485595703125, 0.9639892578125, 1.061492919921875, 1.15899658203125, 1.256500244140625, 1.35400390625, 1.451507568359375, 1.54901123046875, 1.646514892578125, 1.7440185546875, 1.841522216796875, 1.93902587890625, 2.036529541015625, 2.134033203125, 2.231536865234375, 2.32904052734375, 2.426544189453125, 2.5240478515625, 2.621551513671875, 2.71905517578125, 2.816558837890625, 2.9140625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 7.0, 10.0, 10.0, 15.0, 15.0, 14.0, 26.0, 22.0, 33.0, 24.0, 44.0, 33.0, 43.0, 49.0, 85.0, 125.0, 335.0, 1451.0, 185.0, 93.0, 72.0, 45.0, 33.0, 43.0, 31.0, 36.0, 20.0, 33.0, 23.0, 20.0, 13.0, 11.0, 19.0, 5.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.5513916015625, -7.251220703125, -6.9510498046875, -6.65087890625, -6.3507080078125, -6.050537109375, -5.7503662109375, -5.4501953125, -5.1500244140625, -4.849853515625, -4.5496826171875, -4.24951171875, -3.9493408203125, -3.649169921875, -3.3489990234375, -3.048828125, -2.7486572265625, -2.448486328125, -2.1483154296875, -1.84814453125, -1.5479736328125, -1.247802734375, -0.9476318359375, -0.6474609375, -0.3472900390625, -0.047119140625, 0.2530517578125, 0.55322265625, 0.8533935546875, 1.153564453125, 1.4537353515625, 1.75390625, 2.0540771484375, 2.354248046875, 2.6544189453125, 2.95458984375, 3.2547607421875, 3.554931640625, 3.8551025390625, 4.1552734375, 4.4554443359375, 4.755615234375, 5.0557861328125, 5.35595703125, 5.6561279296875, 5.956298828125, 6.2564697265625, 6.556640625, 6.8568115234375, 7.156982421875, 7.4571533203125, 7.75732421875, 8.0574951171875, 8.357666015625, 8.6578369140625, 8.9580078125, 9.2581787109375, 9.558349609375, 9.8585205078125, 10.15869140625, 10.4588623046875, 10.759033203125, 11.0592041015625, 11.359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 6.0, 13.0, 10.0, 17.0, 22.0, 33.0, 31.0, 40.0, 59.0, 76.0, 115.0, 168.0, 232.0, 413.0, 1152.0, 49961.0, 3085490.0, 6176.0, 680.0, 318.0, 188.0, 115.0, 88.0, 65.0, 59.0, 46.0, 25.0, 16.0, 11.0, 12.0, 8.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.057373046875, -25.06787109375, -24.078369140625, -23.0888671875, -22.099365234375, -21.10986328125, -20.120361328125, -19.130859375, -18.141357421875, -17.15185546875, -16.162353515625, -15.1728515625, -14.183349609375, -13.19384765625, -12.204345703125, -11.21484375, -10.225341796875, -9.23583984375, -8.246337890625, -7.2568359375, -6.267333984375, -5.27783203125, -4.288330078125, -3.298828125, -2.309326171875, -1.31982421875, -0.330322265625, 0.6591796875, 1.648681640625, 2.63818359375, 3.627685546875, 4.6171875, 5.606689453125, 6.59619140625, 7.585693359375, 8.5751953125, 9.564697265625, 10.55419921875, 11.543701171875, 12.533203125, 13.522705078125, 14.51220703125, 15.501708984375, 16.4912109375, 17.480712890625, 18.47021484375, 19.459716796875, 20.44921875, 21.438720703125, 22.42822265625, 23.417724609375, 24.4072265625, 25.396728515625, 26.38623046875, 27.375732421875, 28.365234375, 29.354736328125, 30.34423828125, 31.333740234375, 32.3232421875, 33.312744140625, 34.30224609375, 35.291748046875, 36.28125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 7.0, 260.0, 724.0, 27.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.614267349243164, -20.674463272094727, -16.73465919494629, -12.794856071472168, -8.85505199432373, -4.915248870849609, -0.9754447937011719, 2.9643592834472656, 6.904163360595703, 10.84396743774414, 14.783771514892578, 18.723575592041016, 22.663379669189453, 26.603181838989258, 30.542985916137695, 34.4827880859375, 38.42259216308594, 42.362396240234375, 46.30220031738281, 50.24200439453125, 54.18180847167969, 58.121612548828125, 62.06141662597656, 66.001220703125, 69.94102478027344, 73.88082885742188, 77.82063293457031, 81.76043701171875, 85.70024108886719, 89.64004516601562, 93.57984924316406, 97.5196533203125, 101.4594497680664, 105.39925384521484, 109.33905792236328, 113.27886199951172, 117.21866607666016, 121.1584701538086, 125.09827423095703, 129.03807067871094, 132.97787475585938, 136.9176788330078, 140.85748291015625, 144.7972869873047, 148.73709106445312, 152.67689514160156, 156.61669921875, 160.55650329589844, 164.49630737304688, 168.4361114501953, 172.37591552734375, 176.3157196044922, 180.25552368164062, 184.19532775878906, 188.1351318359375, 192.07493591308594, 196.01473999023438, 199.9545440673828, 203.89434814453125, 207.8341522216797, 211.77395629882812, 215.71376037597656, 219.653564453125, 223.59336853027344, 227.53317260742188]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 9.0, 12.0, 6.0, 7.0, 7.0, 15.0, 10.0, 18.0, 18.0, 22.0, 25.0, 35.0, 33.0, 24.0, 30.0, 40.0, 36.0, 38.0, 40.0, 44.0, 46.0, 35.0, 45.0, 43.0, 32.0, 29.0, 31.0, 34.0, 24.0, 31.0, 33.0, 25.0, 20.0, 21.0, 19.0, 13.0, 8.0, 8.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-29.23430061340332, -28.441085815429688, -27.647872924804688, -26.854658126831055, -26.061443328857422, -25.268230438232422, -24.47501564025879, -23.681800842285156, -22.888587951660156, -22.095373153686523, -21.302160263061523, -20.50894546508789, -19.715730667114258, -18.922515869140625, -18.129302978515625, -17.336088180541992, -16.54287338256836, -15.749659538269043, -14.95644474029541, -14.163230895996094, -13.370016098022461, -12.576802253723145, -11.783588409423828, -10.990373611450195, -10.197159767150879, -9.403945922851562, -8.61073112487793, -7.817517280578613, -7.024302959442139, -6.231088638305664, -5.437874794006348, -4.644660472869873, -3.8514480590820312, -3.0582337379455566, -2.265019655227661, -1.4718055725097656, -0.678591251373291, 0.1146230697631836, 0.9078369140625, 1.7010512351989746, 2.494265556335449, 3.287479877471924, 4.080694198608398, 4.873908042907715, 5.6671223640441895, 6.460336685180664, 7.2535505294799805, 8.046764373779297, 8.83997917175293, 9.633193016052246, 10.426407814025879, 11.219621658325195, 12.012836456298828, 12.806050300598145, 13.599264144897461, 14.392478942871094, 15.18569278717041, 15.978906631469727, 16.77212142944336, 17.56533432006836, 18.358549118041992, 19.151763916015625, 19.944976806640625, 20.738191604614258, 21.53140640258789]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 7.0, 5.0, 5.0, 11.0, 18.0, 12.0, 13.0, 15.0, 19.0, 22.0, 24.0, 26.0, 41.0, 28.0, 31.0, 46.0, 38.0, 41.0, 46.0, 48.0, 50.0, 37.0, 35.0, 46.0, 38.0, 44.0, 29.0, 24.0, 29.0, 32.0, 18.0, 14.0, 22.0, 8.0, 10.0, 14.0, 11.0, 5.0, 9.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.904296875, -2.813507080078125, -2.72271728515625, -2.631927490234375, -2.5411376953125, -2.450347900390625, -2.35955810546875, -2.268768310546875, -2.177978515625, -2.087188720703125, -1.99639892578125, -1.905609130859375, -1.8148193359375, -1.724029541015625, -1.63323974609375, -1.542449951171875, -1.45166015625, -1.360870361328125, -1.27008056640625, -1.179290771484375, -1.0885009765625, -0.997711181640625, -0.90692138671875, -0.816131591796875, -0.725341796875, -0.634552001953125, -0.54376220703125, -0.452972412109375, -0.3621826171875, -0.271392822265625, -0.18060302734375, -0.089813232421875, 0.0009765625, 0.091766357421875, 0.18255615234375, 0.273345947265625, 0.3641357421875, 0.454925537109375, 0.54571533203125, 0.636505126953125, 0.727294921875, 0.818084716796875, 0.90887451171875, 0.999664306640625, 1.0904541015625, 1.181243896484375, 1.27203369140625, 1.362823486328125, 1.45361328125, 1.544403076171875, 1.63519287109375, 1.725982666015625, 1.8167724609375, 1.907562255859375, 1.99835205078125, 2.089141845703125, 2.179931640625, 2.270721435546875, 2.36151123046875, 2.452301025390625, 2.5430908203125, 2.633880615234375, 2.72467041015625, 2.815460205078125, 2.90625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 10.0, 9.0, 15.0, 11.0, 18.0, 14.0, 14.0, 20.0, 19.0, 39.0, 45.0, 43.0, 65.0, 139.0, 293.0, 850.0, 4361.0, 120869.0, 2561323.0, 1463866.0, 38001.0, 2667.0, 786.0, 279.0, 162.0, 80.0, 51.0, 38.0, 22.0, 19.0, 27.0, 19.0, 10.0, 14.0, 5.0, 10.0, 9.0, 10.0, 8.0, 12.0, 0.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.609375, -9.31689453125, -9.0244140625, -8.73193359375, -8.439453125, -8.14697265625, -7.8544921875, -7.56201171875, -7.26953125, -6.97705078125, -6.6845703125, -6.39208984375, -6.099609375, -5.80712890625, -5.5146484375, -5.22216796875, -4.9296875, -4.63720703125, -4.3447265625, -4.05224609375, -3.759765625, -3.46728515625, -3.1748046875, -2.88232421875, -2.58984375, -2.29736328125, -2.0048828125, -1.71240234375, -1.419921875, -1.12744140625, -0.8349609375, -0.54248046875, -0.25, 0.04248046875, 0.3349609375, 0.62744140625, 0.919921875, 1.21240234375, 1.5048828125, 1.79736328125, 2.08984375, 2.38232421875, 2.6748046875, 2.96728515625, 3.259765625, 3.55224609375, 3.8447265625, 4.13720703125, 4.4296875, 4.72216796875, 5.0146484375, 5.30712890625, 5.599609375, 5.89208984375, 6.1845703125, 6.47705078125, 6.76953125, 7.06201171875, 7.3544921875, 7.64697265625, 7.939453125, 8.23193359375, 8.5244140625, 8.81689453125, 9.109375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 14.0, 17.0, 16.0, 22.0, 38.0, 51.0, 60.0, 91.0, 110.0, 174.0, 222.0, 274.0, 322.0, 370.0, 399.0, 384.0, 356.0, 275.0, 202.0, 159.0, 123.0, 109.0, 67.0, 48.0, 50.0, 30.0, 23.0, 14.0, 11.0, 5.0, 8.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.71875, -5.5430908203125, -5.367431640625, -5.1917724609375, -5.01611328125, -4.8404541015625, -4.664794921875, -4.4891357421875, -4.3134765625, -4.1378173828125, -3.962158203125, -3.7864990234375, -3.61083984375, -3.4351806640625, -3.259521484375, -3.0838623046875, -2.908203125, -2.7325439453125, -2.556884765625, -2.3812255859375, -2.20556640625, -2.0299072265625, -1.854248046875, -1.6785888671875, -1.5029296875, -1.3272705078125, -1.151611328125, -0.9759521484375, -0.80029296875, -0.6246337890625, -0.448974609375, -0.2733154296875, -0.09765625, 0.0780029296875, 0.253662109375, 0.4293212890625, 0.60498046875, 0.7806396484375, 0.956298828125, 1.1319580078125, 1.3076171875, 1.4832763671875, 1.658935546875, 1.8345947265625, 2.01025390625, 2.1859130859375, 2.361572265625, 2.5372314453125, 2.712890625, 2.8885498046875, 3.064208984375, 3.2398681640625, 3.41552734375, 3.5911865234375, 3.766845703125, 3.9425048828125, 4.1181640625, 4.2938232421875, 4.469482421875, 4.6451416015625, 4.82080078125, 4.9964599609375, 5.172119140625, 5.3477783203125, 5.5234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 8.0, 9.0, 9.0, 17.0, 16.0, 31.0, 49.0, 62.0, 91.0, 106.0, 182.0, 214.0, 285.0, 504.0, 1217.0, 25683.0, 3447004.0, 712177.0, 4573.0, 729.0, 388.0, 264.0, 190.0, 125.0, 99.0, 70.0, 49.0, 35.0, 25.0, 22.0, 13.0, 14.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.405029296875, -16.77880859375, -16.152587890625, -15.5263671875, -14.900146484375, -14.27392578125, -13.647705078125, -13.021484375, -12.395263671875, -11.76904296875, -11.142822265625, -10.5166015625, -9.890380859375, -9.26416015625, -8.637939453125, -8.01171875, -7.385498046875, -6.75927734375, -6.133056640625, -5.5068359375, -4.880615234375, -4.25439453125, -3.628173828125, -3.001953125, -2.375732421875, -1.74951171875, -1.123291015625, -0.4970703125, 0.129150390625, 0.75537109375, 1.381591796875, 2.0078125, 2.634033203125, 3.26025390625, 3.886474609375, 4.5126953125, 5.138916015625, 5.76513671875, 6.391357421875, 7.017578125, 7.643798828125, 8.27001953125, 8.896240234375, 9.5224609375, 10.148681640625, 10.77490234375, 11.401123046875, 12.02734375, 12.653564453125, 13.27978515625, 13.906005859375, 14.5322265625, 15.158447265625, 15.78466796875, 16.410888671875, 17.037109375, 17.663330078125, 18.28955078125, 18.915771484375, 19.5419921875, 20.168212890625, 20.79443359375, 21.420654296875, 22.046875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 56.0, 244.0, 411.0, 238.0, 54.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.37199401855469, -96.48629760742188, -93.60060119628906, -90.71491241455078, -87.82921600341797, -84.94351959228516, -82.05783081054688, -79.17213439941406, -76.28643798828125, -73.40074157714844, -70.51504516601562, -67.62935638427734, -64.74365997314453, -61.85796356201172, -58.97227096557617, -56.086578369140625, -53.20088195800781, -50.315185546875, -47.42949295043945, -44.543800354003906, -41.658103942871094, -38.77240753173828, -35.886714935302734, -33.00102233886719, -30.115325927734375, -27.229631423950195, -24.343936920166016, -21.458242416381836, -18.572547912597656, -15.686853408813477, -12.801158905029297, -9.915464401245117, -7.0297698974609375, -4.144075393676758, -1.2583808898925781, 1.6273136138916016, 4.513008117675781, 7.398702621459961, 10.28439712524414, 13.17009162902832, 16.0557861328125, 18.94148063659668, 21.82717514038086, 24.71286964416504, 27.59856414794922, 30.4842586517334, 33.36995315551758, 36.255645751953125, 39.14134216308594, 42.02703857421875, 44.9127311706543, 47.798423767089844, 50.684120178222656, 53.56981658935547, 56.455509185791016, 59.34120178222656, 62.226898193359375, 65.11259460449219, 67.998291015625, 70.88397979736328, 73.7696762084961, 76.6553726196289, 79.54106140136719, 82.4267578125, 85.31245422363281]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 10.0, 13.0, 14.0, 17.0, 21.0, 16.0, 22.0, 24.0, 31.0, 39.0, 41.0, 40.0, 38.0, 35.0, 43.0, 49.0, 41.0, 44.0, 52.0, 49.0, 35.0, 46.0, 31.0, 34.0, 35.0, 30.0, 24.0, 18.0, 15.0, 12.0, 7.0, 11.0, 11.0, 5.0, 12.0, 10.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.26325225830078, -18.639440536499023, -18.015626907348633, -17.391815185546875, -16.768003463745117, -16.14419174194336, -15.520378112792969, -14.896566390991211, -14.272753715515137, -13.648941040039062, -13.025129318237305, -12.40131664276123, -11.777503967285156, -11.153692245483398, -10.529879570007324, -9.90606689453125, -9.282255172729492, -8.658442497253418, -8.03463077545166, -7.410818099975586, -6.78700590133667, -6.163193702697754, -5.53938102722168, -4.915568828582764, -4.291756629943848, -3.6679444313049316, -3.0441319942474365, -2.4203195571899414, -1.7965073585510254, -1.1726951599121094, -0.5488827228546143, 0.07492971420288086, 0.6987419128417969, 1.3225542306900024, 1.946366548538208, 2.570178985595703, 3.193991184234619, 3.817803382873535, 4.441616058349609, 5.065428256988525, 5.689240455627441, 6.313052654266357, 6.936864852905273, 7.560677528381348, 8.184490203857422, 8.80830192565918, 9.432114601135254, 10.055927276611328, 10.679738998413086, 11.30355167388916, 11.927363395690918, 12.551176071166992, 13.17498779296875, 13.798800468444824, 14.422613143920898, 15.046424865722656, 15.67023754119873, 16.294050216674805, 16.917861938476562, 17.54167366027832, 18.16548728942871, 18.78929901123047, 19.413110733032227, 20.036924362182617, 20.660736083984375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 15.0, 22.0, 15.0, 25.0, 22.0, 34.0, 35.0, 29.0, 35.0, 37.0, 41.0, 43.0, 49.0, 42.0, 51.0, 39.0, 52.0, 37.0, 43.0, 42.0, 36.0, 29.0, 33.0, 24.0, 18.0, 32.0, 21.0, 14.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.019744873046875, -2.92620849609375, -2.832672119140625, -2.7391357421875, -2.645599365234375, -2.55206298828125, -2.458526611328125, -2.364990234375, -2.271453857421875, -2.17791748046875, -2.084381103515625, -1.9908447265625, -1.897308349609375, -1.80377197265625, -1.710235595703125, -1.61669921875, -1.523162841796875, -1.42962646484375, -1.336090087890625, -1.2425537109375, -1.149017333984375, -1.05548095703125, -0.961944580078125, -0.868408203125, -0.774871826171875, -0.68133544921875, -0.587799072265625, -0.4942626953125, -0.400726318359375, -0.30718994140625, -0.213653564453125, -0.1201171875, -0.026580810546875, 0.06695556640625, 0.160491943359375, 0.2540283203125, 0.347564697265625, 0.44110107421875, 0.534637451171875, 0.628173828125, 0.721710205078125, 0.81524658203125, 0.908782958984375, 1.0023193359375, 1.095855712890625, 1.18939208984375, 1.282928466796875, 1.37646484375, 1.470001220703125, 1.56353759765625, 1.657073974609375, 1.7506103515625, 1.844146728515625, 1.93768310546875, 2.031219482421875, 2.124755859375, 2.218292236328125, 2.31182861328125, 2.405364990234375, 2.4989013671875, 2.592437744140625, 2.68597412109375, 2.779510498046875, 2.873046875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 10.0, 10.0, 14.0, 13.0, 22.0, 36.0, 37.0, 63.0, 102.0, 127.0, 211.0, 299.0, 462.0, 780.0, 1129.0, 1866.0, 2919.0, 4876.0, 7488.0, 12303.0, 19930.0, 32437.0, 54822.0, 103209.0, 232474.0, 289340.0, 123512.0, 63711.0, 36927.0, 22611.0, 13801.0, 8593.0, 5287.0, 3303.0, 2123.0, 1243.0, 850.0, 561.0, 340.0, 247.0, 163.0, 104.0, 68.0, 51.0, 28.0, 25.0, 10.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.52197265625, -0.5046463012695312, -0.4873199462890625, -0.46999359130859375, -0.452667236328125, -0.43534088134765625, -0.4180145263671875, -0.40068817138671875, -0.38336181640625, -0.36603546142578125, -0.3487091064453125, -0.33138275146484375, -0.314056396484375, -0.29673004150390625, -0.2794036865234375, -0.26207733154296875, -0.2447509765625, -0.22742462158203125, -0.2100982666015625, -0.19277191162109375, -0.175445556640625, -0.15811920166015625, -0.1407928466796875, -0.12346649169921875, -0.10614013671875, -0.08881378173828125, -0.0714874267578125, -0.05416107177734375, -0.036834716796875, -0.01950836181640625, -0.0021820068359375, 0.01514434814453125, 0.032470703125, 0.04979705810546875, 0.0671234130859375, 0.08444976806640625, 0.101776123046875, 0.11910247802734375, 0.1364288330078125, 0.15375518798828125, 0.17108154296875, 0.18840789794921875, 0.2057342529296875, 0.22306060791015625, 0.240386962890625, 0.25771331787109375, 0.2750396728515625, 0.29236602783203125, 0.3096923828125, 0.32701873779296875, 0.3443450927734375, 0.36167144775390625, 0.378997802734375, 0.39632415771484375, 0.4136505126953125, 0.43097686767578125, 0.44830322265625, 0.46562957763671875, 0.4829559326171875, 0.5002822875976562, 0.517608642578125, 0.5349349975585938, 0.5522613525390625, 0.5695877075195312, 0.5869140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 2.0, 6.0, 5.0, 7.0, 12.0, 6.0, 15.0, 14.0, 10.0, 17.0, 18.0, 30.0, 23.0, 27.0, 34.0, 28.0, 27.0, 32.0, 31.0, 35.0, 48.0, 47.0, 1057.0, 38.0, 38.0, 37.0, 42.0, 33.0, 37.0, 31.0, 31.0, 30.0, 29.0, 25.0, 24.0, 20.0, 14.0, 21.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.5855865478515625, -1.530548095703125, -1.4755096435546875, -1.42047119140625, -1.3654327392578125, -1.310394287109375, -1.2553558349609375, -1.2003173828125, -1.1452789306640625, -1.090240478515625, -1.0352020263671875, -0.98016357421875, -0.9251251220703125, -0.870086669921875, -0.8150482177734375, -0.760009765625, -0.7049713134765625, -0.649932861328125, -0.5948944091796875, -0.53985595703125, -0.4848175048828125, -0.429779052734375, -0.3747406005859375, -0.3197021484375, -0.2646636962890625, -0.209625244140625, -0.1545867919921875, -0.09954833984375, -0.0445098876953125, 0.010528564453125, 0.0655670166015625, 0.12060546875, 0.1756439208984375, 0.230682373046875, 0.2857208251953125, 0.34075927734375, 0.3957977294921875, 0.450836181640625, 0.5058746337890625, 0.5609130859375, 0.6159515380859375, 0.670989990234375, 0.7260284423828125, 0.78106689453125, 0.8361053466796875, 0.891143798828125, 0.9461822509765625, 1.001220703125, 1.0562591552734375, 1.111297607421875, 1.1663360595703125, 1.22137451171875, 1.2764129638671875, 1.331451416015625, 1.3864898681640625, 1.4415283203125, 1.4965667724609375, 1.551605224609375, 1.6066436767578125, 1.66168212890625, 1.7167205810546875, 1.771759033203125, 1.8267974853515625, 1.8818359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 5.0, 12.0, 8.0, 25.0, 27.0, 44.0, 81.0, 99.0, 163.0, 196.0, 357.0, 468.0, 726.0, 1051.0, 1483.0, 2226.0, 3194.0, 4941.0, 7389.0, 11353.0, 17699.0, 28251.0, 45215.0, 78062.0, 146501.0, 1337546.0, 178003.0, 90189.0, 52024.0, 31605.0, 19887.0, 12868.0, 8464.0, 5580.0, 3675.0, 2521.0, 1687.0, 1135.0, 776.0, 538.0, 326.0, 259.0, 162.0, 105.0, 83.0, 36.0, 33.0, 14.0, 15.0, 18.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43358612060546875, -0.4184417724609375, -0.40329742431640625, -0.388153076171875, -0.37300872802734375, -0.3578643798828125, -0.34272003173828125, -0.32757568359375, -0.31243133544921875, -0.2972869873046875, -0.28214263916015625, -0.266998291015625, -0.25185394287109375, -0.2367095947265625, -0.22156524658203125, -0.2064208984375, -0.19127655029296875, -0.1761322021484375, -0.16098785400390625, -0.145843505859375, -0.13069915771484375, -0.1155548095703125, -0.10041046142578125, -0.08526611328125, -0.07012176513671875, -0.0549774169921875, -0.03983306884765625, -0.024688720703125, -0.00954437255859375, 0.0055999755859375, 0.02074432373046875, 0.035888671875, 0.05103302001953125, 0.0661773681640625, 0.08132171630859375, 0.096466064453125, 0.11161041259765625, 0.1267547607421875, 0.14189910888671875, 0.15704345703125, 0.17218780517578125, 0.1873321533203125, 0.20247650146484375, 0.217620849609375, 0.23276519775390625, 0.2479095458984375, 0.26305389404296875, 0.2781982421875, 0.29334259033203125, 0.3084869384765625, 0.32363128662109375, 0.338775634765625, 0.35391998291015625, 0.3690643310546875, 0.38420867919921875, 0.39935302734375, 0.41449737548828125, 0.4296417236328125, 0.44478607177734375, 0.459930419921875, 0.47507476806640625, 0.4902191162109375, 0.5053634643554688, 0.5205078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 8.0, 11.0, 15.0, 17.0, 19.0, 25.0, 24.0, 48.0, 51.0, 40.0, 53.0, 59.0, 61.0, 69.0, 66.0, 65.0, 62.0, 48.0, 56.0, 38.0, 29.0, 24.0, 19.0, 14.0, 13.0, 15.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003540515899658203, -0.0003424994647502899, -0.0003309473395347595, -0.0003193952143192291, -0.00030784308910369873, -0.00029629096388816833, -0.00028473883867263794, -0.00027318671345710754, -0.00026163458824157715, -0.00025008246302604675, -0.00023853033781051636, -0.00022697821259498596, -0.00021542608737945557, -0.00020387396216392517, -0.00019232183694839478, -0.00018076971173286438, -0.00016921758651733398, -0.0001576654613018036, -0.0001461133360862732, -0.0001345612108707428, -0.0001230090856552124, -0.00011145696043968201, -9.990483522415161e-05, -8.835271000862122e-05, -7.680058479309082e-05, -6.524845957756042e-05, -5.369633436203003e-05, -4.2144209146499634e-05, -3.059208393096924e-05, -1.9039958715438843e-05, -7.487833499908447e-06, 4.064291715621948e-06, 1.5616416931152344e-05, 2.716854214668274e-05, 3.8720667362213135e-05, 5.027279257774353e-05, 6.182491779327393e-05, 7.337704300880432e-05, 8.492916822433472e-05, 9.648129343986511e-05, 0.00010803341865539551, 0.0001195855438709259, 0.0001311376690864563, 0.0001426897943019867, 0.0001542419195175171, 0.00016579404473304749, 0.00017734616994857788, 0.00018889829516410828, 0.00020045042037963867, 0.00021200254559516907, 0.00022355467081069946, 0.00023510679602622986, 0.00024665892124176025, 0.00025821104645729065, 0.00026976317167282104, 0.00028131529688835144, 0.00029286742210388184, 0.00030441954731941223, 0.0003159716725349426, 0.000327523797750473, 0.0003390759229660034, 0.0003506280481815338, 0.0003621801733970642, 0.0003737322986125946, 0.000385284423828125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 10.0, 7.0, 9.0, 16.0, 18.0, 21.0, 30.0, 29.0, 58.0, 67.0, 107.0, 155.0, 370.0, 863.0, 28850.0, 1014845.0, 1845.0, 527.0, 251.0, 123.0, 107.0, 61.0, 49.0, 30.0, 27.0, 26.0, 13.0, 8.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00848388671875, -0.008228898048400879, -0.007973909378051758, -0.007718920707702637, -0.007463932037353516, -0.0072089433670043945, -0.0069539546966552734, -0.006698966026306152, -0.006443977355957031, -0.00618898868560791, -0.005934000015258789, -0.005679011344909668, -0.005424022674560547, -0.005169034004211426, -0.004914045333862305, -0.004659056663513184, -0.0044040679931640625, -0.004149079322814941, -0.0038940906524658203, -0.0036391019821166992, -0.003384113311767578, -0.003129124641418457, -0.002874135971069336, -0.002619147300720215, -0.0023641586303710938, -0.0021091699600219727, -0.0018541812896728516, -0.0015991926193237305, -0.0013442039489746094, -0.0010892152786254883, -0.0008342266082763672, -0.0005792379379272461, -0.000324249267578125, -6.92605972290039e-05, 0.0001857280731201172, 0.0004407167434692383, 0.0006957054138183594, 0.0009506940841674805, 0.0012056827545166016, 0.0014606714248657227, 0.0017156600952148438, 0.001970648765563965, 0.002225637435913086, 0.002480626106262207, 0.002735614776611328, 0.0029906034469604492, 0.0032455921173095703, 0.0035005807876586914, 0.0037555694580078125, 0.004010558128356934, 0.004265546798706055, 0.004520535469055176, 0.004775524139404297, 0.005030512809753418, 0.005285501480102539, 0.00554049015045166, 0.005795478820800781, 0.006050467491149902, 0.0063054561614990234, 0.0065604448318481445, 0.006815433502197266, 0.007070422172546387, 0.007325410842895508, 0.007580399513244629, 0.00783538818359375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 59.0, 313.0, 479.0, 140.0, 13.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006493672262877226, -0.0006214406457729638, -0.0005935140652582049, -0.0005655874847434461, -0.0005376609042286873, -0.0005097342655062675, -0.0004818077140953392, -0.0004538811044767499, -0.00042595452396199107, -0.00039802794344723225, -0.0003701013629324734, -0.0003421747824177146, -0.0003142481727991253, -0.0002863215922843665, -0.00025839501176960766, -0.0002304684167029336, -0.00020254185074009, -0.0001746152702253312, -0.00014668867515865713, -0.00011876209464389831, -9.083550685318187e-05, -6.290891906246543e-05, -3.4982338547706604e-05, -7.05574348103255e-06, 2.0870837033726275e-05, 4.8797424824442714e-05, 7.672401261515915e-05, 0.00010465059312991798, 0.0001325771736446768, 0.00016050376871135086, 0.00018843034922610968, 0.00021635694429278374, 0.00024428352480754256, 0.0002722101053223014, 0.0003001366858370602, 0.00032806326635181904, 0.0003559898759704083, 0.00038391645648516715, 0.00041184303699992597, 0.00043976964661851525, 0.0004676962271332741, 0.0004956228076480329, 0.0005235493881627917, 0.0005514759686775506, 0.0005794025491923094, 0.0006073291879147291, 0.000635255710221827, 0.0006631823489442468, 0.0006911088712513447, 0.0007190354517661035, 0.0007469620322808623, 0.0007748886127956212, 0.00080281519331038, 0.0008307418320327997, 0.0008586683543398976, 0.0008865949930623174, 0.0009145215735770762, 0.000942448154091835, 0.0009703747346065938, 0.0009983013151213527, 0.0010262279538437724, 0.0010541544761508703, 0.00108208111487329, 0.001110007637180388, 0.0011379342759028077]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 1.0, 11.0, 8.0, 17.0, 11.0, 10.0, 16.0, 19.0, 18.0, 34.0, 27.0, 37.0, 46.0, 33.0, 28.0, 33.0, 32.0, 46.0, 49.0, 39.0, 43.0, 41.0, 57.0, 43.0, 40.0, 34.0, 26.0, 33.0, 25.0, 25.0, 27.0, 17.0, 9.0, 15.0, 19.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016677379608154297, -0.00016130134463310242, -0.00015582889318466187, -0.0001503564417362213, -0.00014488399028778076, -0.0001394115388393402, -0.00013393908739089966, -0.0001284666359424591, -0.00012299418449401855, -0.000117521733045578, -0.00011204928159713745, -0.0001065768301486969, -0.00010110437870025635, -9.56319272518158e-05, -9.015947580337524e-05, -8.468702435493469e-05, -7.921457290649414e-05, -7.374212145805359e-05, -6.826967000961304e-05, -6.279721856117249e-05, -5.7324767112731934e-05, -5.185231566429138e-05, -4.637986421585083e-05, -4.090741276741028e-05, -3.5434961318969727e-05, -2.9962509870529175e-05, -2.4490058422088623e-05, -1.901760697364807e-05, -1.354515552520752e-05, -8.072704076766968e-06, -2.600252628326416e-06, 2.8721988201141357e-06, 8.344650268554688e-06, 1.381710171699524e-05, 1.928955316543579e-05, 2.4762004613876343e-05, 3.0234456062316895e-05, 3.5706907510757446e-05, 4.1179358959198e-05, 4.665181040763855e-05, 5.21242618560791e-05, 5.759671330451965e-05, 6.30691647529602e-05, 6.854161620140076e-05, 7.401406764984131e-05, 7.948651909828186e-05, 8.495897054672241e-05, 9.043142199516296e-05, 9.590387344360352e-05, 0.00010137632489204407, 0.00010684877634048462, 0.00011232122778892517, 0.00011779367923736572, 0.00012326613068580627, 0.00012873858213424683, 0.00013421103358268738, 0.00013968348503112793, 0.00014515593647956848, 0.00015062838792800903, 0.00015610083937644958, 0.00016157329082489014, 0.0001670457422733307, 0.00017251819372177124, 0.0001779906451702118, 0.00018346309661865234]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 15.0, 22.0, 15.0, 25.0, 22.0, 34.0, 35.0, 29.0, 35.0, 37.0, 41.0, 43.0, 49.0, 42.0, 51.0, 39.0, 52.0, 37.0, 43.0, 42.0, 36.0, 29.0, 33.0, 24.0, 18.0, 32.0, 21.0, 14.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.019744873046875, -2.92620849609375, -2.832672119140625, -2.7391357421875, -2.645599365234375, -2.55206298828125, -2.458526611328125, -2.364990234375, -2.271453857421875, -2.17791748046875, -2.084381103515625, -1.9908447265625, -1.897308349609375, -1.80377197265625, -1.710235595703125, -1.61669921875, -1.523162841796875, -1.42962646484375, -1.336090087890625, -1.2425537109375, -1.149017333984375, -1.05548095703125, -0.961944580078125, -0.868408203125, -0.774871826171875, -0.68133544921875, -0.587799072265625, -0.4942626953125, -0.400726318359375, -0.30718994140625, -0.213653564453125, -0.1201171875, -0.026580810546875, 0.06695556640625, 0.160491943359375, 0.2540283203125, 0.347564697265625, 0.44110107421875, 0.534637451171875, 0.628173828125, 0.721710205078125, 0.81524658203125, 0.908782958984375, 1.0023193359375, 1.095855712890625, 1.18939208984375, 1.282928466796875, 1.37646484375, 1.470001220703125, 1.56353759765625, 1.657073974609375, 1.7506103515625, 1.844146728515625, 1.93768310546875, 2.031219482421875, 2.124755859375, 2.218292236328125, 2.31182861328125, 2.405364990234375, 2.4989013671875, 2.592437744140625, 2.68597412109375, 2.779510498046875, 2.873046875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 5.0, 9.0, 9.0, 19.0, 30.0, 36.0, 37.0, 83.0, 102.0, 153.0, 229.0, 356.0, 606.0, 1353.0, 3057.0, 7094.0, 18274.0, 50284.0, 139139.0, 355003.0, 293246.0, 112702.0, 40715.0, 14908.0, 5818.0, 2512.0, 1188.0, 601.0, 361.0, 184.0, 163.0, 76.0, 64.0, 27.0, 34.0, 16.0, 22.0, 7.0, 8.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.41015625, -3.306488037109375, -3.20281982421875, -3.099151611328125, -2.9954833984375, -2.891815185546875, -2.78814697265625, -2.684478759765625, -2.580810546875, -2.477142333984375, -2.37347412109375, -2.269805908203125, -2.1661376953125, -2.062469482421875, -1.95880126953125, -1.855133056640625, -1.75146484375, -1.647796630859375, -1.54412841796875, -1.440460205078125, -1.3367919921875, -1.233123779296875, -1.12945556640625, -1.025787353515625, -0.922119140625, -0.818450927734375, -0.71478271484375, -0.611114501953125, -0.5074462890625, -0.403778076171875, -0.30010986328125, -0.196441650390625, -0.0927734375, 0.010894775390625, 0.11456298828125, 0.218231201171875, 0.3218994140625, 0.425567626953125, 0.52923583984375, 0.632904052734375, 0.736572265625, 0.840240478515625, 0.94390869140625, 1.047576904296875, 1.1512451171875, 1.254913330078125, 1.35858154296875, 1.462249755859375, 1.56591796875, 1.669586181640625, 1.77325439453125, 1.876922607421875, 1.9805908203125, 2.084259033203125, 2.18792724609375, 2.291595458984375, 2.395263671875, 2.498931884765625, 2.60260009765625, 2.706268310546875, 2.8099365234375, 2.913604736328125, 3.01727294921875, 3.120941162109375, 3.224609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 15.0, 17.0, 25.0, 26.0, 23.0, 31.0, 23.0, 46.0, 52.0, 64.0, 70.0, 137.0, 263.0, 1521.0, 229.0, 93.0, 62.0, 53.0, 46.0, 32.0, 27.0, 31.0, 16.0, 27.0, 19.0, 17.0, 8.0, 6.0, 11.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -10.0521240234375, -9.697998046875, -9.3438720703125, -8.98974609375, -8.6356201171875, -8.281494140625, -7.9273681640625, -7.5732421875, -7.2191162109375, -6.864990234375, -6.5108642578125, -6.15673828125, -5.8026123046875, -5.448486328125, -5.0943603515625, -4.740234375, -4.3861083984375, -4.031982421875, -3.6778564453125, -3.32373046875, -2.9696044921875, -2.615478515625, -2.2613525390625, -1.9072265625, -1.5531005859375, -1.198974609375, -0.8448486328125, -0.49072265625, -0.1365966796875, 0.217529296875, 0.5716552734375, 0.92578125, 1.2799072265625, 1.634033203125, 1.9881591796875, 2.34228515625, 2.6964111328125, 3.050537109375, 3.4046630859375, 3.7587890625, 4.1129150390625, 4.467041015625, 4.8211669921875, 5.17529296875, 5.5294189453125, 5.883544921875, 6.2376708984375, 6.591796875, 6.9459228515625, 7.300048828125, 7.6541748046875, 8.00830078125, 8.3624267578125, 8.716552734375, 9.0706787109375, 9.4248046875, 9.7789306640625, 10.133056640625, 10.4871826171875, 10.84130859375, 11.1954345703125, 11.549560546875, 11.9036865234375, 12.2578125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 10.0, 3.0, 3.0, 12.0, 14.0, 15.0, 17.0, 21.0, 28.0, 36.0, 56.0, 59.0, 91.0, 151.0, 241.0, 417.0, 1152.0, 19126.0, 3115308.0, 6910.0, 903.0, 371.0, 220.0, 159.0, 104.0, 69.0, 41.0, 33.0, 21.0, 20.0, 15.0, 12.0, 11.0, 8.0, 7.0, 9.0, 6.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.0, -40.70361328125, -39.4072265625, -38.11083984375, -36.814453125, -35.51806640625, -34.2216796875, -32.92529296875, -31.62890625, -30.33251953125, -29.0361328125, -27.73974609375, -26.443359375, -25.14697265625, -23.8505859375, -22.55419921875, -21.2578125, -19.96142578125, -18.6650390625, -17.36865234375, -16.072265625, -14.77587890625, -13.4794921875, -12.18310546875, -10.88671875, -9.59033203125, -8.2939453125, -6.99755859375, -5.701171875, -4.40478515625, -3.1083984375, -1.81201171875, -0.515625, 0.78076171875, 2.0771484375, 3.37353515625, 4.669921875, 5.96630859375, 7.2626953125, 8.55908203125, 9.85546875, 11.15185546875, 12.4482421875, 13.74462890625, 15.041015625, 16.33740234375, 17.6337890625, 18.93017578125, 20.2265625, 21.52294921875, 22.8193359375, 24.11572265625, 25.412109375, 26.70849609375, 28.0048828125, 29.30126953125, 30.59765625, 31.89404296875, 33.1904296875, 34.48681640625, 35.783203125, 37.07958984375, 38.3759765625, 39.67236328125, 40.96875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 13.0, 41.0, 118.0, 208.0, 242.0, 190.0, 123.0, 48.0, 17.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.137881755828857, -6.310557842254639, -5.48323392868042, -4.655909538269043, -3.8285858631134033, -3.0012617111206055, -2.1739377975463867, -1.346613883972168, -0.5192899703979492, 0.3080340027809143, 1.1353579759597778, 1.9626820087432861, 2.790005922317505, 3.6173300743103027, 4.4446539878845215, 5.27197790145874, 6.099301815032959, 6.926625728607178, 7.7539496421813965, 8.581274032592773, 9.408597946166992, 10.235921859741211, 11.06324577331543, 11.890569686889648, 12.717893600463867, 13.545217514038086, 14.372541427612305, 15.199865341186523, 16.027189254760742, 16.85451316833496, 17.68183708190918, 18.5091609954834, 19.336484909057617, 20.163808822631836, 20.991132736206055, 21.818456649780273, 22.645780563354492, 23.47310447692871, 24.30042839050293, 25.12775230407715, 25.955076217651367, 26.782400131225586, 27.609724044799805, 28.437047958374023, 29.264371871948242, 30.09169578552246, 30.91901969909668, 31.7463436126709, 32.57366943359375, 33.40099334716797, 34.22831726074219, 35.055641174316406, 35.882965087890625, 36.710289001464844, 37.53761291503906, 38.36493682861328, 39.1922607421875, 40.01958465576172, 40.84690856933594, 41.674232482910156, 42.501556396484375, 43.328880310058594, 44.15620422363281, 44.98352813720703, 45.81085205078125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 5.0, 7.0, 8.0, 13.0, 13.0, 22.0, 15.0, 13.0, 19.0, 29.0, 21.0, 33.0, 43.0, 41.0, 36.0, 23.0, 45.0, 46.0, 34.0, 46.0, 44.0, 41.0, 46.0, 23.0, 39.0, 42.0, 32.0, 28.0, 20.0, 37.0, 17.0, 13.0, 28.0, 13.0, 8.0, 6.0, 10.0, 5.0, 8.0, 7.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-27.100921630859375, -26.310359954833984, -25.51979637145996, -24.72923469543457, -23.93867301940918, -23.148109436035156, -22.357547760009766, -21.566986083984375, -20.776424407958984, -19.985862731933594, -19.19529914855957, -18.40473747253418, -17.61417579650879, -16.823612213134766, -16.033050537109375, -15.242488861083984, -14.451925277709961, -13.661362648010254, -12.870800971984863, -12.080238342285156, -11.289676666259766, -10.499114036560059, -9.708551406860352, -8.917989730834961, -8.127427101135254, -7.336864948272705, -6.546302795410156, -5.755740165710449, -4.9651780128479, -4.174615859985352, -3.3840532302856445, -2.5934910774230957, -1.8029308319091797, -1.0123685598373413, -0.22180628776550293, 0.568756103515625, 1.3593182563781738, 2.1498804092407227, 2.9404430389404297, 3.7310051918029785, 4.521567344665527, 5.312129497528076, 6.102691650390625, 6.893254280090332, 7.683816432952881, 8.47437858581543, 9.264941215515137, 10.055503845214844, 10.846065521240234, 11.636628150939941, 12.427189826965332, 13.217752456665039, 14.00831413269043, 14.798876762390137, 15.589439392089844, 16.380001068115234, 17.170562744140625, 17.961124420166016, 18.75168800354004, 19.54224967956543, 20.33281135559082, 21.123374938964844, 21.913936614990234, 22.704498291015625, 23.49506187438965]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 7.0, 5.0, 6.0, 3.0, 12.0, 13.0, 13.0, 11.0, 28.0, 12.0, 22.0, 25.0, 22.0, 31.0, 37.0, 41.0, 40.0, 35.0, 35.0, 43.0, 39.0, 41.0, 31.0, 28.0, 37.0, 28.0, 46.0, 44.0, 39.0, 27.0, 23.0, 24.0, 16.0, 21.0, 23.0, 12.0, 16.0, 12.0, 12.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.123046875, -3.029815673828125, -2.93658447265625, -2.843353271484375, -2.7501220703125, -2.656890869140625, -2.56365966796875, -2.470428466796875, -2.377197265625, -2.283966064453125, -2.19073486328125, -2.097503662109375, -2.0042724609375, -1.911041259765625, -1.81781005859375, -1.724578857421875, -1.63134765625, -1.538116455078125, -1.44488525390625, -1.351654052734375, -1.2584228515625, -1.165191650390625, -1.07196044921875, -0.978729248046875, -0.885498046875, -0.792266845703125, -0.69903564453125, -0.605804443359375, -0.5125732421875, -0.419342041015625, -0.32611083984375, -0.232879638671875, -0.1396484375, -0.046417236328125, 0.04681396484375, 0.140045166015625, 0.2332763671875, 0.326507568359375, 0.41973876953125, 0.512969970703125, 0.606201171875, 0.699432373046875, 0.79266357421875, 0.885894775390625, 0.9791259765625, 1.072357177734375, 1.16558837890625, 1.258819580078125, 1.35205078125, 1.445281982421875, 1.53851318359375, 1.631744384765625, 1.7249755859375, 1.818206787109375, 1.91143798828125, 2.004669189453125, 2.097900390625, 2.191131591796875, 2.28436279296875, 2.377593994140625, 2.4708251953125, 2.564056396484375, 2.65728759765625, 2.750518798828125, 2.84375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 7.0, 4.0, 7.0, 18.0, 23.0, 21.0, 29.0, 21.0, 36.0, 51.0, 58.0, 106.0, 170.0, 255.0, 532.0, 1443.0, 8758.0, 139346.0, 1511165.0, 2182001.0, 326525.0, 19234.0, 2549.0, 783.0, 380.0, 214.0, 149.0, 88.0, 65.0, 52.0, 40.0, 23.0, 12.0, 15.0, 12.0, 14.0, 13.0, 8.0, 11.0, 3.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-7.28515625, -7.07183837890625, -6.8585205078125, -6.64520263671875, -6.431884765625, -6.21856689453125, -6.0052490234375, -5.79193115234375, -5.57861328125, -5.36529541015625, -5.1519775390625, -4.93865966796875, -4.725341796875, -4.51202392578125, -4.2987060546875, -4.08538818359375, -3.8720703125, -3.65875244140625, -3.4454345703125, -3.23211669921875, -3.018798828125, -2.80548095703125, -2.5921630859375, -2.37884521484375, -2.16552734375, -1.95220947265625, -1.7388916015625, -1.52557373046875, -1.312255859375, -1.09893798828125, -0.8856201171875, -0.67230224609375, -0.458984375, -0.24566650390625, -0.0323486328125, 0.18096923828125, 0.394287109375, 0.60760498046875, 0.8209228515625, 1.03424072265625, 1.24755859375, 1.46087646484375, 1.6741943359375, 1.88751220703125, 2.100830078125, 2.31414794921875, 2.5274658203125, 2.74078369140625, 2.9541015625, 3.16741943359375, 3.3807373046875, 3.59405517578125, 3.807373046875, 4.02069091796875, 4.2340087890625, 4.44732666015625, 4.66064453125, 4.87396240234375, 5.0872802734375, 5.30059814453125, 5.513916015625, 5.72723388671875, 5.9405517578125, 6.15386962890625, 6.3671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 9.0, 8.0, 24.0, 30.0, 39.0, 36.0, 57.0, 85.0, 115.0, 142.0, 226.0, 269.0, 348.0, 421.0, 443.0, 383.0, 369.0, 262.0, 207.0, 177.0, 114.0, 86.0, 57.0, 43.0, 39.0, 18.0, 16.0, 14.0, 8.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.17108154296875, -5.9749755859375, -5.77886962890625, -5.582763671875, -5.38665771484375, -5.1905517578125, -4.99444580078125, -4.79833984375, -4.60223388671875, -4.4061279296875, -4.21002197265625, -4.013916015625, -3.81781005859375, -3.6217041015625, -3.42559814453125, -3.2294921875, -3.03338623046875, -2.8372802734375, -2.64117431640625, -2.445068359375, -2.24896240234375, -2.0528564453125, -1.85675048828125, -1.66064453125, -1.46453857421875, -1.2684326171875, -1.07232666015625, -0.876220703125, -0.68011474609375, -0.4840087890625, -0.28790283203125, -0.091796875, 0.10430908203125, 0.3004150390625, 0.49652099609375, 0.692626953125, 0.88873291015625, 1.0848388671875, 1.28094482421875, 1.47705078125, 1.67315673828125, 1.8692626953125, 2.06536865234375, 2.261474609375, 2.45758056640625, 2.6536865234375, 2.84979248046875, 3.0458984375, 3.24200439453125, 3.4381103515625, 3.63421630859375, 3.830322265625, 4.02642822265625, 4.2225341796875, 4.41864013671875, 4.61474609375, 4.81085205078125, 5.0069580078125, 5.20306396484375, 5.399169921875, 5.59527587890625, 5.7913818359375, 5.98748779296875, 6.18359375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 11.0, 12.0, 16.0, 21.0, 20.0, 44.0, 69.0, 74.0, 124.0, 127.0, 238.0, 297.0, 413.0, 866.0, 21210.0, 3509198.0, 656434.0, 3275.0, 536.0, 372.0, 268.0, 164.0, 140.0, 95.0, 54.0, 58.0, 47.0, 29.0, 25.0, 10.0, 10.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.015625, -21.34423828125, -20.6728515625, -20.00146484375, -19.330078125, -18.65869140625, -17.9873046875, -17.31591796875, -16.64453125, -15.97314453125, -15.3017578125, -14.63037109375, -13.958984375, -13.28759765625, -12.6162109375, -11.94482421875, -11.2734375, -10.60205078125, -9.9306640625, -9.25927734375, -8.587890625, -7.91650390625, -7.2451171875, -6.57373046875, -5.90234375, -5.23095703125, -4.5595703125, -3.88818359375, -3.216796875, -2.54541015625, -1.8740234375, -1.20263671875, -0.53125, 0.14013671875, 0.8115234375, 1.48291015625, 2.154296875, 2.82568359375, 3.4970703125, 4.16845703125, 4.83984375, 5.51123046875, 6.1826171875, 6.85400390625, 7.525390625, 8.19677734375, 8.8681640625, 9.53955078125, 10.2109375, 10.88232421875, 11.5537109375, 12.22509765625, 12.896484375, 13.56787109375, 14.2392578125, 14.91064453125, 15.58203125, 16.25341796875, 16.9248046875, 17.59619140625, 18.267578125, 18.93896484375, 19.6103515625, 20.28173828125, 20.953125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 20.0, 31.0, 55.0, 58.0, 81.0, 90.0, 117.0, 104.0, 96.0, 96.0, 68.0, 52.0, 44.0, 32.0, 21.0, 15.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.229339599609375, -29.47683334350586, -28.724327087402344, -27.971820831298828, -27.219314575195312, -26.466808319091797, -25.71430206298828, -24.961795806884766, -24.20928955078125, -23.456783294677734, -22.70427703857422, -21.951770782470703, -21.199264526367188, -20.446758270263672, -19.694252014160156, -18.94174575805664, -18.189241409301758, -17.436735153198242, -16.684228897094727, -15.931722640991211, -15.179216384887695, -14.42671012878418, -13.67420482635498, -12.921698570251465, -12.16919231414795, -11.416686058044434, -10.664179801940918, -9.911674499511719, -9.159168243408203, -8.406661987304688, -7.654155731201172, -6.901649475097656, -6.149145126342773, -5.396638870239258, -4.644132614135742, -3.8916268348693848, -3.139120578765869, -2.3866143226623535, -1.634108543395996, -0.8816022872924805, -0.12909603118896484, 0.6234101057052612, 1.3759162425994873, 2.128422260284424, 2.8809285163879395, 3.633434772491455, 4.3859405517578125, 5.138446807861328, 5.890953063964844, 6.643459320068359, 7.395965576171875, 8.14847183227539, 8.900978088378906, 9.653484344482422, 10.405989646911621, 11.158495903015137, 11.911002159118652, 12.663508415222168, 13.416014671325684, 14.168519973754883, 14.921026229858398, 15.673532485961914, 16.42603874206543, 17.178544998168945, 17.93105125427246]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 1.0, 6.0, 9.0, 8.0, 9.0, 14.0, 8.0, 32.0, 15.0, 21.0, 32.0, 17.0, 44.0, 29.0, 34.0, 43.0, 42.0, 49.0, 47.0, 39.0, 46.0, 50.0, 47.0, 55.0, 44.0, 36.0, 45.0, 30.0, 32.0, 19.0, 22.0, 18.0, 11.0, 12.0, 12.0, 11.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.076969146728516, -20.358362197875977, -19.639753341674805, -18.921146392822266, -18.202539443969727, -17.483930587768555, -16.765323638916016, -16.046714782714844, -15.328107833862305, -14.60949993133545, -13.89089298248291, -13.172285079956055, -12.4536771774292, -11.735069274902344, -11.016462326049805, -10.29785442352295, -9.57924747467041, -8.860639572143555, -8.142032623291016, -7.42342472076416, -6.704816818237305, -5.986209392547607, -5.26760196685791, -4.548994064331055, -3.8303866386413574, -3.111778974533081, -2.3931713104248047, -1.6745638847351074, -0.955956220626831, -0.2373485565185547, 0.4812588691711426, 1.199866771697998, 1.9184741973876953, 2.6370818614959717, 3.355689525604248, 4.074296951293945, 4.792904853820801, 5.511512279510498, 6.230119705200195, 6.948727607727051, 7.667335033416748, 8.385942459106445, 9.1045503616333, 9.823158264160156, 10.541765213012695, 11.26037311553955, 11.978981018066406, 12.697587966918945, 13.4161958694458, 14.134803771972656, 14.853410720825195, 15.57201862335205, 16.290626525878906, 17.009233474731445, 17.727840423583984, 18.446449279785156, 19.165056228637695, 19.883663177490234, 20.602272033691406, 21.320878982543945, 22.039485931396484, 22.758094787597656, 23.476701736450195, 24.195308685302734, 24.913917541503906]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 15.0, 27.0, 16.0, 16.0, 19.0, 34.0, 36.0, 24.0, 28.0, 44.0, 37.0, 45.0, 34.0, 37.0, 33.0, 43.0, 38.0, 39.0, 37.0, 38.0, 36.0, 29.0, 36.0, 29.0, 20.0, 16.0, 19.0, 18.0, 24.0, 17.0, 11.0, 7.0, 7.0, 14.0, 6.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76177978515625, -2.6719970703125, -2.58221435546875, -2.492431640625, -2.40264892578125, -2.3128662109375, -2.22308349609375, -2.13330078125, -2.04351806640625, -1.9537353515625, -1.86395263671875, -1.774169921875, -1.68438720703125, -1.5946044921875, -1.50482177734375, -1.4150390625, -1.32525634765625, -1.2354736328125, -1.14569091796875, -1.055908203125, -0.96612548828125, -0.8763427734375, -0.78656005859375, -0.69677734375, -0.60699462890625, -0.5172119140625, -0.42742919921875, -0.337646484375, -0.24786376953125, -0.1580810546875, -0.06829833984375, 0.021484375, 0.11126708984375, 0.2010498046875, 0.29083251953125, 0.380615234375, 0.47039794921875, 0.5601806640625, 0.64996337890625, 0.73974609375, 0.82952880859375, 0.9193115234375, 1.00909423828125, 1.098876953125, 1.18865966796875, 1.2784423828125, 1.36822509765625, 1.4580078125, 1.54779052734375, 1.6375732421875, 1.72735595703125, 1.817138671875, 1.90692138671875, 1.9967041015625, 2.08648681640625, 2.17626953125, 2.26605224609375, 2.3558349609375, 2.44561767578125, 2.535400390625, 2.62518310546875, 2.7149658203125, 2.80474853515625, 2.89453125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 7.0, 14.0, 16.0, 30.0, 44.0, 53.0, 98.0, 99.0, 148.0, 247.0, 402.0, 548.0, 801.0, 1231.0, 1728.0, 2577.0, 3838.0, 5766.0, 8419.0, 12789.0, 18863.0, 29283.0, 45331.0, 74132.0, 137112.0, 275459.0, 180946.0, 92373.0, 54390.0, 34463.0, 22068.0, 14924.0, 9909.0, 6700.0, 4504.0, 2926.0, 2073.0, 1419.0, 908.0, 581.0, 429.0, 307.0, 188.0, 119.0, 93.0, 72.0, 46.0, 29.0, 16.0, 18.0, 4.0, 10.0, 4.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.5205078125, -0.5045852661132812, -0.4886627197265625, -0.47274017333984375, -0.456817626953125, -0.44089508056640625, -0.4249725341796875, -0.40904998779296875, -0.39312744140625, -0.37720489501953125, -0.3612823486328125, -0.34535980224609375, -0.329437255859375, -0.31351470947265625, -0.2975921630859375, -0.28166961669921875, -0.2657470703125, -0.24982452392578125, -0.2339019775390625, -0.21797943115234375, -0.202056884765625, -0.18613433837890625, -0.1702117919921875, -0.15428924560546875, -0.13836669921875, -0.12244415283203125, -0.1065216064453125, -0.09059906005859375, -0.074676513671875, -0.05875396728515625, -0.0428314208984375, -0.02690887451171875, -0.010986328125, 0.00493621826171875, 0.0208587646484375, 0.03678131103515625, 0.052703857421875, 0.06862640380859375, 0.0845489501953125, 0.10047149658203125, 0.11639404296875, 0.13231658935546875, 0.1482391357421875, 0.16416168212890625, 0.180084228515625, 0.19600677490234375, 0.2119293212890625, 0.22785186767578125, 0.2437744140625, 0.25969696044921875, 0.2756195068359375, 0.29154205322265625, 0.307464599609375, 0.32338714599609375, 0.3393096923828125, 0.35523223876953125, 0.37115478515625, 0.38707733154296875, 0.4029998779296875, 0.41892242431640625, 0.434844970703125, 0.45076751708984375, 0.4666900634765625, 0.48261260986328125, 0.49853515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 7.0, 10.0, 11.0, 7.0, 8.0, 13.0, 14.0, 17.0, 13.0, 14.0, 29.0, 27.0, 24.0, 29.0, 32.0, 41.0, 33.0, 47.0, 37.0, 37.0, 1062.0, 38.0, 37.0, 26.0, 37.0, 33.0, 26.0, 22.0, 27.0, 26.0, 33.0, 29.0, 31.0, 23.0, 16.0, 14.0, 12.0, 12.0, 14.0, 12.0, 5.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-1.935546875, -1.88006591796875, -1.8245849609375, -1.76910400390625, -1.713623046875, -1.65814208984375, -1.6026611328125, -1.54718017578125, -1.49169921875, -1.43621826171875, -1.3807373046875, -1.32525634765625, -1.269775390625, -1.21429443359375, -1.1588134765625, -1.10333251953125, -1.0478515625, -0.99237060546875, -0.9368896484375, -0.88140869140625, -0.825927734375, -0.77044677734375, -0.7149658203125, -0.65948486328125, -0.60400390625, -0.54852294921875, -0.4930419921875, -0.43756103515625, -0.382080078125, -0.32659912109375, -0.2711181640625, -0.21563720703125, -0.16015625, -0.10467529296875, -0.0491943359375, 0.00628662109375, 0.061767578125, 0.11724853515625, 0.1727294921875, 0.22821044921875, 0.28369140625, 0.33917236328125, 0.3946533203125, 0.45013427734375, 0.505615234375, 0.56109619140625, 0.6165771484375, 0.67205810546875, 0.7275390625, 0.78302001953125, 0.8385009765625, 0.89398193359375, 0.949462890625, 1.00494384765625, 1.0604248046875, 1.11590576171875, 1.17138671875, 1.22686767578125, 1.2823486328125, 1.33782958984375, 1.393310546875, 1.44879150390625, 1.5042724609375, 1.55975341796875, 1.615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 24.0, 24.0, 44.0, 40.0, 85.0, 143.0, 154.0, 252.0, 356.0, 612.0, 849.0, 1191.0, 1718.0, 2544.0, 3881.0, 5571.0, 8686.0, 13032.0, 20271.0, 31704.0, 51076.0, 87654.0, 173704.0, 1342331.0, 146130.0, 77403.0, 45662.0, 27971.0, 18045.0, 11778.0, 7834.0, 5150.0, 3529.0, 2454.0, 1694.0, 1125.0, 784.0, 521.0, 382.0, 211.0, 183.0, 117.0, 75.0, 44.0, 25.0, 21.0, 15.0, 7.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5243377685546875, -0.508148193359375, -0.4919586181640625, -0.47576904296875, -0.4595794677734375, -0.443389892578125, -0.4272003173828125, -0.4110107421875, -0.3948211669921875, -0.378631591796875, -0.3624420166015625, -0.34625244140625, -0.3300628662109375, -0.313873291015625, -0.2976837158203125, -0.281494140625, -0.2653045654296875, -0.249114990234375, -0.2329254150390625, -0.21673583984375, -0.2005462646484375, -0.184356689453125, -0.1681671142578125, -0.1519775390625, -0.1357879638671875, -0.119598388671875, -0.1034088134765625, -0.08721923828125, -0.0710296630859375, -0.054840087890625, -0.0386505126953125, -0.0224609375, -0.0062713623046875, 0.009918212890625, 0.0261077880859375, 0.04229736328125, 0.0584869384765625, 0.074676513671875, 0.0908660888671875, 0.1070556640625, 0.1232452392578125, 0.139434814453125, 0.1556243896484375, 0.17181396484375, 0.1880035400390625, 0.204193115234375, 0.2203826904296875, 0.236572265625, 0.2527618408203125, 0.268951416015625, 0.2851409912109375, 0.30133056640625, 0.3175201416015625, 0.333709716796875, 0.3498992919921875, 0.3660888671875, 0.3822784423828125, 0.398468017578125, 0.4146575927734375, 0.43084716796875, 0.4470367431640625, 0.463226318359375, 0.4794158935546875, 0.49560546875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 3.0, 10.0, 12.0, 10.0, 20.0, 14.0, 23.0, 22.0, 33.0, 26.0, 30.0, 58.0, 60.0, 67.0, 66.0, 75.0, 69.0, 65.0, 51.0, 41.0, 49.0, 30.0, 23.0, 21.0, 19.0, 18.0, 13.0, 7.0, 12.0, 6.0, 4.0, 4.0, 4.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037384033203125, -0.00036083534359931946, -0.0003478303551673889, -0.0003348253667354584, -0.00032182037830352783, -0.0003088153898715973, -0.00029581040143966675, -0.0002828054130077362, -0.00026980042457580566, -0.0002567954361438751, -0.00024379044771194458, -0.00023078545928001404, -0.0002177804708480835, -0.00020477548241615295, -0.0001917704939842224, -0.00017876550555229187, -0.00016576051712036133, -0.00015275552868843079, -0.00013975054025650024, -0.0001267455518245697, -0.00011374056339263916, -0.00010073557496070862, -8.773058652877808e-05, -7.472559809684753e-05, -6.172060966491699e-05, -4.871562123298645e-05, -3.571063280105591e-05, -2.2705644369125366e-05, -9.700655937194824e-06, 3.3043324947357178e-06, 1.630932092666626e-05, 2.9314309358596802e-05, 4.2319297790527344e-05, 5.5324286222457886e-05, 6.832927465438843e-05, 8.133426308631897e-05, 9.433925151824951e-05, 0.00010734423995018005, 0.0001203492283821106, 0.00013335421681404114, 0.00014635920524597168, 0.00015936419367790222, 0.00017236918210983276, 0.0001853741705417633, 0.00019837915897369385, 0.0002113841474056244, 0.00022438913583755493, 0.00023739412426948547, 0.000250399112701416, 0.00026340410113334656, 0.0002764090895652771, 0.00028941407799720764, 0.0003024190664291382, 0.0003154240548610687, 0.00032842904329299927, 0.0003414340317249298, 0.00035443902015686035, 0.0003674440085887909, 0.00038044899702072144, 0.000393453985452652, 0.0004064589738845825, 0.00041946396231651306, 0.0004324689507484436, 0.00044547393918037415, 0.0004584789276123047]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 8.0, 8.0, 9.0, 13.0, 18.0, 15.0, 21.0, 26.0, 29.0, 37.0, 62.0, 83.0, 135.0, 216.0, 405.0, 950.0, 131347.0, 912327.0, 1452.0, 549.0, 251.0, 159.0, 80.0, 73.0, 56.0, 55.0, 27.0, 24.0, 23.0, 16.0, 16.0, 12.0, 10.0, 4.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00946807861328125, -0.009198606014251709, -0.008929133415222168, -0.008659660816192627, -0.008390188217163086, -0.008120715618133545, -0.007851243019104004, -0.007581770420074463, -0.007312297821044922, -0.007042825222015381, -0.00677335262298584, -0.006503880023956299, -0.006234407424926758, -0.005964934825897217, -0.005695462226867676, -0.005425989627838135, -0.005156517028808594, -0.004887044429779053, -0.004617571830749512, -0.004348099231719971, -0.00407862663269043, -0.0038091540336608887, -0.0035396814346313477, -0.0032702088356018066, -0.0030007362365722656, -0.0027312636375427246, -0.0024617910385131836, -0.0021923184394836426, -0.0019228458404541016, -0.0016533732414245605, -0.0013839006423950195, -0.0011144280433654785, -0.0008449554443359375, -0.0005754828453063965, -0.00030601024627685547, -3.653764724731445e-05, 0.00023293495178222656, 0.0005024075508117676, 0.0007718801498413086, 0.0010413527488708496, 0.0013108253479003906, 0.0015802979469299316, 0.0018497705459594727, 0.0021192431449890137, 0.0023887157440185547, 0.0026581883430480957, 0.0029276609420776367, 0.0031971335411071777, 0.0034666061401367188, 0.0037360787391662598, 0.004005551338195801, 0.004275023937225342, 0.004544496536254883, 0.004813969135284424, 0.005083441734313965, 0.005352914333343506, 0.005622386932373047, 0.005891859531402588, 0.006161332130432129, 0.00643080472946167, 0.006700277328491211, 0.006969749927520752, 0.007239222526550293, 0.007508695125579834, 0.007778167724609375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 54.0, 660.0, 297.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010406688088551164, -0.0009949058294296265, -0.0009491429664194584, -0.0009033800452016294, -0.0008576171239838004, -0.0008118542027659714, -0.0007660912815481424, -0.0007203283603303134, -0.0006745654391124845, -0.0006288025178946555, -0.0005830395966768265, -0.0005372766754589975, -0.0004915137542411685, -0.0004457508330233395, -0.0003999879118055105, -0.00035422499058768153, -0.00030846206936985254, -0.00026269914815202355, -0.00021693622693419456, -0.00017117330571636558, -0.0001254103844985366, -7.96474632807076e-05, -3.388454206287861e-05, 1.187837915495038e-05, 5.764130037277937e-05, 0.00010340422159060836, 0.00014916714280843735, 0.00019493006402626634, 0.00024069298524409533, 0.0002864559064619243, 0.0003322188276797533, 0.0003779817488975823, 0.0004237447865307331, 0.0004695077077485621, 0.0005152706289663911, 0.0005610335501842201, 0.0006067964714020491, 0.000652559392619878, 0.000698322313837707, 0.000744085235055536, 0.000789848156273365, 0.000835611077491194, 0.000881373998709023, 0.000927136919926852, 0.000972899841144681, 0.001018662704154849, 0.001064425683580339, 0.0011101886630058289, 0.001155951526015997, 0.001201714389026165, 0.001247477368451655, 0.0012932403478771448, 0.0013390032108873129, 0.001384766073897481, 0.0014305290533229709, 0.0014762920327484608, 0.0015220548957586288, 0.001567817758768797, 0.0016135807381942868, 0.0016593437176197767, 0.0017051065806299448, 0.0017508694436401129, 0.0017966324230656028, 0.0018423954024910927, 0.0018881582655012608]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 9.0, 4.0, 5.0, 12.0, 14.0, 15.0, 21.0, 17.0, 20.0, 22.0, 24.0, 20.0, 36.0, 39.0, 36.0, 27.0, 29.0, 31.0, 31.0, 36.0, 33.0, 45.0, 41.0, 41.0, 30.0, 26.0, 32.0, 33.0, 32.0, 28.0, 19.0, 23.0, 24.0, 14.0, 21.0, 15.0, 12.0, 15.0, 15.0, 4.0, 10.0, 5.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 5.0, 3.0], "bins": [-0.0001995563507080078, -0.00019373930990695953, -0.00018792226910591125, -0.00018210522830486298, -0.0001762881875038147, -0.00017047114670276642, -0.00016465410590171814, -0.00015883706510066986, -0.00015302002429962158, -0.0001472029834985733, -0.00014138594269752502, -0.00013556890189647675, -0.00012975186109542847, -0.0001239348202943802, -0.00011811777949333191, -0.00011230073869228363, -0.00010648369789123535, -0.00010066665709018707, -9.48496162891388e-05, -8.903257548809052e-05, -8.321553468704224e-05, -7.739849388599396e-05, -7.158145308494568e-05, -6.57644122838974e-05, -5.994737148284912e-05, -5.413033068180084e-05, -4.8313289880752563e-05, -4.2496249079704285e-05, -3.6679208278656006e-05, -3.086216747760773e-05, -2.5045126676559448e-05, -1.922808587551117e-05, -1.341104507446289e-05, -7.594004273414612e-06, -1.776963472366333e-06, 4.040077328681946e-06, 9.857118129730225e-06, 1.5674158930778503e-05, 2.1491199731826782e-05, 2.730824053287506e-05, 3.312528133392334e-05, 3.894232213497162e-05, 4.47593629360199e-05, 5.0576403737068176e-05, 5.6393444538116455e-05, 6.221048533916473e-05, 6.802752614021301e-05, 7.384456694126129e-05, 7.966160774230957e-05, 8.547864854335785e-05, 9.129568934440613e-05, 9.71127301454544e-05, 0.00010292977094650269, 0.00010874681174755096, 0.00011456385254859924, 0.00012038089334964752, 0.0001261979341506958, 0.00013201497495174408, 0.00013783201575279236, 0.00014364905655384064, 0.00014946609735488892, 0.0001552831381559372, 0.00016110017895698547, 0.00016691721975803375, 0.00017273426055908203]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 15.0, 27.0, 16.0, 16.0, 19.0, 34.0, 36.0, 24.0, 28.0, 44.0, 38.0, 44.0, 34.0, 37.0, 33.0, 42.0, 39.0, 39.0, 37.0, 38.0, 36.0, 29.0, 36.0, 29.0, 20.0, 16.0, 19.0, 18.0, 24.0, 17.0, 11.0, 7.0, 7.0, 14.0, 6.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76177978515625, -2.6719970703125, -2.58221435546875, -2.492431640625, -2.40264892578125, -2.3128662109375, -2.22308349609375, -2.13330078125, -2.04351806640625, -1.9537353515625, -1.86395263671875, -1.774169921875, -1.68438720703125, -1.5946044921875, -1.50482177734375, -1.4150390625, -1.32525634765625, -1.2354736328125, -1.14569091796875, -1.055908203125, -0.96612548828125, -0.8763427734375, -0.78656005859375, -0.69677734375, -0.60699462890625, -0.5172119140625, -0.42742919921875, -0.337646484375, -0.24786376953125, -0.1580810546875, -0.06829833984375, 0.021484375, 0.11126708984375, 0.2010498046875, 0.29083251953125, 0.380615234375, 0.47039794921875, 0.5601806640625, 0.64996337890625, 0.73974609375, 0.82952880859375, 0.9193115234375, 1.00909423828125, 1.098876953125, 1.18865966796875, 1.2784423828125, 1.36822509765625, 1.4580078125, 1.54779052734375, 1.6375732421875, 1.72735595703125, 1.817138671875, 1.90692138671875, 1.9967041015625, 2.08648681640625, 2.17626953125, 2.26605224609375, 2.3558349609375, 2.44561767578125, 2.535400390625, 2.62518310546875, 2.7149658203125, 2.80474853515625, 2.89453125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 1.0, 9.0, 14.0, 13.0, 24.0, 24.0, 47.0, 51.0, 67.0, 103.0, 102.0, 177.0, 245.0, 401.0, 705.0, 1328.0, 2677.0, 5535.0, 13060.0, 30777.0, 74208.0, 171382.0, 373984.0, 212173.0, 92397.0, 38601.0, 16359.0, 7071.0, 3228.0, 1583.0, 815.0, 423.0, 269.0, 170.0, 119.0, 115.0, 82.0, 58.0, 37.0, 31.0, 21.0, 22.0, 11.0, 7.0, 9.0, 6.0, 8.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.751953125, -2.664947509765625, -2.57794189453125, -2.490936279296875, -2.4039306640625, -2.316925048828125, -2.22991943359375, -2.142913818359375, -2.055908203125, -1.968902587890625, -1.88189697265625, -1.794891357421875, -1.7078857421875, -1.620880126953125, -1.53387451171875, -1.446868896484375, -1.35986328125, -1.272857666015625, -1.18585205078125, -1.098846435546875, -1.0118408203125, -0.924835205078125, -0.83782958984375, -0.750823974609375, -0.663818359375, -0.576812744140625, -0.48980712890625, -0.402801513671875, -0.3157958984375, -0.228790283203125, -0.14178466796875, -0.054779052734375, 0.0322265625, 0.119232177734375, 0.20623779296875, 0.293243408203125, 0.3802490234375, 0.467254638671875, 0.55426025390625, 0.641265869140625, 0.728271484375, 0.815277099609375, 0.90228271484375, 0.989288330078125, 1.0762939453125, 1.163299560546875, 1.25030517578125, 1.337310791015625, 1.42431640625, 1.511322021484375, 1.59832763671875, 1.685333251953125, 1.7723388671875, 1.859344482421875, 1.94635009765625, 2.033355712890625, 2.120361328125, 2.207366943359375, 2.29437255859375, 2.381378173828125, 2.4683837890625, 2.555389404296875, 2.64239501953125, 2.729400634765625, 2.81640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 3.0, 10.0, 7.0, 8.0, 13.0, 12.0, 16.0, 15.0, 21.0, 29.0, 18.0, 32.0, 35.0, 38.0, 44.0, 43.0, 56.0, 99.0, 234.0, 1512.0, 283.0, 76.0, 60.0, 53.0, 40.0, 27.0, 25.0, 37.0, 27.0, 22.0, 25.0, 23.0, 14.0, 11.0, 9.0, 15.0, 7.0, 10.0, 3.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.3671875, -10.028076171875, -9.68896484375, -9.349853515625, -9.0107421875, -8.671630859375, -8.33251953125, -7.993408203125, -7.654296875, -7.315185546875, -6.97607421875, -6.636962890625, -6.2978515625, -5.958740234375, -5.61962890625, -5.280517578125, -4.94140625, -4.602294921875, -4.26318359375, -3.924072265625, -3.5849609375, -3.245849609375, -2.90673828125, -2.567626953125, -2.228515625, -1.889404296875, -1.55029296875, -1.211181640625, -0.8720703125, -0.532958984375, -0.19384765625, 0.145263671875, 0.484375, 0.823486328125, 1.16259765625, 1.501708984375, 1.8408203125, 2.179931640625, 2.51904296875, 2.858154296875, 3.197265625, 3.536376953125, 3.87548828125, 4.214599609375, 4.5537109375, 4.892822265625, 5.23193359375, 5.571044921875, 5.91015625, 6.249267578125, 6.58837890625, 6.927490234375, 7.2666015625, 7.605712890625, 7.94482421875, 8.283935546875, 8.623046875, 8.962158203125, 9.30126953125, 9.640380859375, 9.9794921875, 10.318603515625, 10.65771484375, 10.996826171875, 11.3359375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 15.0, 12.0, 16.0, 25.0, 33.0, 49.0, 74.0, 124.0, 179.0, 381.0, 1402.0, 1727101.0, 1413984.0, 1332.0, 403.0, 204.0, 104.0, 80.0, 48.0, 41.0, 33.0, 19.0, 11.0, 8.0, 8.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.5, -69.5673828125, -67.634765625, -65.7021484375, -63.76953125, -61.8369140625, -59.904296875, -57.9716796875, -56.0390625, -54.1064453125, -52.173828125, -50.2412109375, -48.30859375, -46.3759765625, -44.443359375, -42.5107421875, -40.578125, -38.6455078125, -36.712890625, -34.7802734375, -32.84765625, -30.9150390625, -28.982421875, -27.0498046875, -25.1171875, -23.1845703125, -21.251953125, -19.3193359375, -17.38671875, -15.4541015625, -13.521484375, -11.5888671875, -9.65625, -7.7236328125, -5.791015625, -3.8583984375, -1.92578125, 0.0068359375, 1.939453125, 3.8720703125, 5.8046875, 7.7373046875, 9.669921875, 11.6025390625, 13.53515625, 15.4677734375, 17.400390625, 19.3330078125, 21.265625, 23.1982421875, 25.130859375, 27.0634765625, 28.99609375, 30.9287109375, 32.861328125, 34.7939453125, 36.7265625, 38.6591796875, 40.591796875, 42.5244140625, 44.45703125, 46.3896484375, 48.322265625, 50.2548828125, 52.1875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 38.0, 165.0, 292.0, 318.0, 149.0, 37.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66176700592041, -5.574765682220459, -4.487764358520508, -3.4007625579833984, -2.3137612342834473, -1.226759910583496, -0.13975811004638672, 0.9472432136535645, 2.0342445373535156, 3.121245861053467, 4.208247184753418, 5.295248985290527, 6.3822503089904785, 7.46925163269043, 8.556253433227539, 9.643255233764648, 10.730256080627441, 11.81725788116455, 12.904258728027344, 13.991260528564453, 15.078262329101562, 16.165264129638672, 17.25226593017578, 18.339265823364258, 19.426267623901367, 20.513269424438477, 21.600271224975586, 22.687271118164062, 23.774272918701172, 24.86127471923828, 25.94827651977539, 27.0352783203125, 28.12228012084961, 29.20928192138672, 30.296283721923828, 31.383285522460938, 32.47028732299805, 33.557289123535156, 34.644287109375, 35.73128890991211, 36.81829071044922, 37.90529251098633, 38.99229431152344, 40.07929611206055, 41.166297912597656, 42.2532958984375, 43.340301513671875, 44.42729949951172, 45.514305114746094, 46.6013069152832, 47.68830871582031, 48.77531051635742, 49.86231231689453, 50.949310302734375, 52.03631591796875, 53.123313903808594, 54.2103157043457, 55.29731750488281, 56.38431930541992, 57.47132110595703, 58.55832290649414, 59.64532470703125, 60.732322692871094, 61.8193244934082, 62.90632629394531]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 3.0, 4.0, 5.0, 7.0, 8.0, 6.0, 7.0, 12.0, 15.0, 10.0, 28.0, 22.0, 20.0, 20.0, 26.0, 31.0, 33.0, 37.0, 34.0, 36.0, 41.0, 41.0, 47.0, 34.0, 43.0, 43.0, 39.0, 30.0, 24.0, 42.0, 38.0, 33.0, 31.0, 27.0, 23.0, 16.0, 15.0, 16.0, 14.0, 13.0, 10.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.7840576171875, -20.971065521240234, -20.1580753326416, -19.345083236694336, -18.532093048095703, -17.719100952148438, -16.906108856201172, -16.093116760253906, -15.280126571655273, -14.467135429382324, -13.654144287109375, -12.84115219116211, -12.02816104888916, -11.215169906616211, -10.402177810668945, -9.589186668395996, -8.776195526123047, -7.963204383850098, -7.15021276473999, -6.337221145629883, -5.524230003356934, -4.711238861083984, -3.898247241973877, -3.0852556228637695, -2.2722644805908203, -1.459273099899292, -0.6462817192077637, 0.16670966148376465, 0.979701042175293, 1.7926921844482422, 2.6056838035583496, 3.418675422668457, 4.231666564941406, 5.0446577072143555, 5.857649326324463, 6.67064094543457, 7.4836320877075195, 8.296623229980469, 9.109615325927734, 9.922606468200684, 10.735597610473633, 11.548588752746582, 12.361579895019531, 13.174571990966797, 13.987563133239746, 14.800554275512695, 15.613546371459961, 16.426536560058594, 17.23952865600586, 18.052520751953125, 18.865510940551758, 19.678503036499023, 20.491493225097656, 21.304485321044922, 22.117477416992188, 22.930469512939453, 23.743459701538086, 24.55645179748535, 25.369441986083984, 26.18243408203125, 26.995426177978516, 27.80841636657715, 28.621408462524414, 29.434398651123047, 30.247390747070312]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 11.0, 8.0, 11.0, 19.0, 7.0, 19.0, 22.0, 26.0, 16.0, 27.0, 28.0, 31.0, 27.0, 40.0, 32.0, 37.0, 32.0, 36.0, 39.0, 37.0, 42.0, 40.0, 36.0, 40.0, 35.0, 38.0, 38.0, 32.0, 23.0, 24.0, 22.0, 12.0, 14.0, 19.0, 13.0, 12.0, 8.0, 15.0, 11.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.116058349609375, -3.01727294921875, -2.918487548828125, -2.8197021484375, -2.720916748046875, -2.62213134765625, -2.523345947265625, -2.424560546875, -2.325775146484375, -2.22698974609375, -2.128204345703125, -2.0294189453125, -1.930633544921875, -1.83184814453125, -1.733062744140625, -1.63427734375, -1.535491943359375, -1.43670654296875, -1.337921142578125, -1.2391357421875, -1.140350341796875, -1.04156494140625, -0.942779541015625, -0.843994140625, -0.745208740234375, -0.64642333984375, -0.547637939453125, -0.4488525390625, -0.350067138671875, -0.25128173828125, -0.152496337890625, -0.0537109375, 0.045074462890625, 0.14385986328125, 0.242645263671875, 0.3414306640625, 0.440216064453125, 0.53900146484375, 0.637786865234375, 0.736572265625, 0.835357666015625, 0.93414306640625, 1.032928466796875, 1.1317138671875, 1.230499267578125, 1.32928466796875, 1.428070068359375, 1.52685546875, 1.625640869140625, 1.72442626953125, 1.823211669921875, 1.9219970703125, 2.020782470703125, 2.11956787109375, 2.218353271484375, 2.317138671875, 2.415924072265625, 2.51470947265625, 2.613494873046875, 2.7122802734375, 2.811065673828125, 2.90985107421875, 3.008636474609375, 3.107421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 11.0, 14.0, 14.0, 24.0, 23.0, 39.0, 44.0, 44.0, 54.0, 63.0, 74.0, 94.0, 124.0, 167.0, 342.0, 699.0, 3017.0, 32336.0, 598964.0, 2567670.0, 927391.0, 56354.0, 4565.0, 926.0, 391.0, 199.0, 134.0, 100.0, 78.0, 35.0, 47.0, 38.0, 33.0, 27.0, 26.0, 26.0, 19.0, 19.0, 13.0, 8.0, 4.0, 11.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.2850341796875, -7.054443359375, -6.8238525390625, -6.59326171875, -6.3626708984375, -6.132080078125, -5.9014892578125, -5.6708984375, -5.4403076171875, -5.209716796875, -4.9791259765625, -4.74853515625, -4.5179443359375, -4.287353515625, -4.0567626953125, -3.826171875, -3.5955810546875, -3.364990234375, -3.1343994140625, -2.90380859375, -2.6732177734375, -2.442626953125, -2.2120361328125, -1.9814453125, -1.7508544921875, -1.520263671875, -1.2896728515625, -1.05908203125, -0.8284912109375, -0.597900390625, -0.3673095703125, -0.13671875, 0.0938720703125, 0.324462890625, 0.5550537109375, 0.78564453125, 1.0162353515625, 1.246826171875, 1.4774169921875, 1.7080078125, 1.9385986328125, 2.169189453125, 2.3997802734375, 2.63037109375, 2.8609619140625, 3.091552734375, 3.3221435546875, 3.552734375, 3.7833251953125, 4.013916015625, 4.2445068359375, 4.47509765625, 4.7056884765625, 4.936279296875, 5.1668701171875, 5.3974609375, 5.6280517578125, 5.858642578125, 6.0892333984375, 6.31982421875, 6.5504150390625, 6.781005859375, 7.0115966796875, 7.2421875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 8.0, 12.0, 10.0, 18.0, 24.0, 29.0, 27.0, 58.0, 70.0, 71.0, 98.0, 157.0, 151.0, 193.0, 277.0, 299.0, 364.0, 384.0, 347.0, 311.0, 258.0, 183.0, 154.0, 127.0, 92.0, 73.0, 54.0, 41.0, 40.0, 26.0, 29.0, 16.0, 13.0, 8.0, 7.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.875, -5.70941162109375, -5.5438232421875, -5.37823486328125, -5.212646484375, -5.04705810546875, -4.8814697265625, -4.71588134765625, -4.55029296875, -4.38470458984375, -4.2191162109375, -4.05352783203125, -3.887939453125, -3.72235107421875, -3.5567626953125, -3.39117431640625, -3.2255859375, -3.05999755859375, -2.8944091796875, -2.72882080078125, -2.563232421875, -2.39764404296875, -2.2320556640625, -2.06646728515625, -1.90087890625, -1.73529052734375, -1.5697021484375, -1.40411376953125, -1.238525390625, -1.07293701171875, -0.9073486328125, -0.74176025390625, -0.576171875, -0.41058349609375, -0.2449951171875, -0.07940673828125, 0.086181640625, 0.25177001953125, 0.4173583984375, 0.58294677734375, 0.74853515625, 0.91412353515625, 1.0797119140625, 1.24530029296875, 1.410888671875, 1.57647705078125, 1.7420654296875, 1.90765380859375, 2.0732421875, 2.23883056640625, 2.4044189453125, 2.57000732421875, 2.735595703125, 2.90118408203125, 3.0667724609375, 3.23236083984375, 3.39794921875, 3.56353759765625, 3.7291259765625, 3.89471435546875, 4.060302734375, 4.22589111328125, 4.3914794921875, 4.55706787109375, 4.72265625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 7.0, 6.0, 9.0, 12.0, 13.0, 17.0, 24.0, 36.0, 42.0, 38.0, 63.0, 85.0, 111.0, 162.0, 239.0, 317.0, 459.0, 1483.0, 179444.0, 3979257.0, 30054.0, 878.0, 407.0, 255.0, 218.0, 150.0, 108.0, 97.0, 76.0, 59.0, 36.0, 22.0, 23.0, 20.0, 11.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.111083984375, -21.33154296875, -20.552001953125, -19.7724609375, -18.992919921875, -18.21337890625, -17.433837890625, -16.654296875, -15.874755859375, -15.09521484375, -14.315673828125, -13.5361328125, -12.756591796875, -11.97705078125, -11.197509765625, -10.41796875, -9.638427734375, -8.85888671875, -8.079345703125, -7.2998046875, -6.520263671875, -5.74072265625, -4.961181640625, -4.181640625, -3.402099609375, -2.62255859375, -1.843017578125, -1.0634765625, -0.283935546875, 0.49560546875, 1.275146484375, 2.0546875, 2.834228515625, 3.61376953125, 4.393310546875, 5.1728515625, 5.952392578125, 6.73193359375, 7.511474609375, 8.291015625, 9.070556640625, 9.85009765625, 10.629638671875, 11.4091796875, 12.188720703125, 12.96826171875, 13.747802734375, 14.52734375, 15.306884765625, 16.08642578125, 16.865966796875, 17.6455078125, 18.425048828125, 19.20458984375, 19.984130859375, 20.763671875, 21.543212890625, 22.32275390625, 23.102294921875, 23.8818359375, 24.661376953125, 25.44091796875, 26.220458984375, 27.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 48.0, 340.0, 448.0, 160.0, 13.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03895950317383, -29.493732452392578, -25.948505401611328, -22.403278350830078, -18.858051300048828, -15.312822341918945, -11.767595291137695, -8.222368240356445, -4.677141189575195, -1.1319139003753662, 2.413313388824463, 5.958540916442871, 9.503767967224121, 13.048995971679688, 16.594223022460938, 20.139450073242188, 23.684677124023438, 27.229904174804688, 30.775131225585938, 34.32035827636719, 37.86558532714844, 41.41081237792969, 44.95603942871094, 48.50126647949219, 52.04649353027344, 55.59172058105469, 59.13694763183594, 62.68217468261719, 66.22740173339844, 69.77262878417969, 73.31785583496094, 76.86308288574219, 80.40831756591797, 83.95354461669922, 87.49877166748047, 91.04399871826172, 94.58922576904297, 98.13445281982422, 101.67967987060547, 105.22490692138672, 108.77013397216797, 112.31536102294922, 115.86058807373047, 119.40581512451172, 122.95104217529297, 126.49626922607422, 130.04150390625, 133.58673095703125, 137.1319580078125, 140.67718505859375, 144.222412109375, 147.76763916015625, 151.3128662109375, 154.85809326171875, 158.4033203125, 161.94854736328125, 165.4937744140625, 169.03900146484375, 172.584228515625, 176.12945556640625, 179.6746826171875, 183.21990966796875, 186.76513671875, 190.31036376953125, 193.8555908203125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 10.0, 14.0, 12.0, 21.0, 21.0, 18.0, 29.0, 16.0, 18.0, 37.0, 27.0, 27.0, 29.0, 45.0, 43.0, 43.0, 42.0, 38.0, 49.0, 40.0, 47.0, 39.0, 32.0, 38.0, 37.0, 23.0, 28.0, 25.0, 20.0, 18.0, 16.0, 14.0, 15.0, 12.0, 10.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.97812271118164, -20.312986373901367, -19.647851943969727, -18.982715606689453, -18.31757926940918, -17.65244483947754, -16.987308502197266, -16.322174072265625, -15.657037734985352, -14.991902351379395, -14.326766014099121, -13.661630630493164, -12.996495246887207, -12.33135986328125, -11.666223526000977, -11.00108814239502, -10.335951805114746, -9.670816421508789, -9.005680084228516, -8.340544700622559, -7.675409317016602, -7.010273456573486, -6.345137596130371, -5.680002212524414, -5.014866352081299, -4.349730491638184, -3.6845951080322266, -3.0194592475891113, -2.354323625564575, -1.689188003540039, -1.0240521430969238, -0.3589167594909668, 0.30621910095214844, 0.9713547825813293, 1.6364904642105103, 2.301626205444336, 2.966761827468872, 3.631897449493408, 4.297033309936523, 4.9621686935424805, 5.627304553985596, 6.292440414428711, 6.957575798034668, 7.622711658477783, 8.287847518920898, 8.952982902526855, 9.618118286132812, 10.283254623413086, 10.948390007019043, 11.613525390625, 12.278661727905273, 12.94379711151123, 13.608932495117188, 14.274068832397461, 14.939204216003418, 15.604339599609375, 16.26947593688965, 16.934612274169922, 17.599746704101562, 18.264883041381836, 18.93001937866211, 19.59515380859375, 20.260290145874023, 20.925426483154297, 21.590560913085938]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 11.0, 11.0, 16.0, 20.0, 26.0, 21.0, 22.0, 26.0, 22.0, 35.0, 29.0, 31.0, 33.0, 43.0, 32.0, 47.0, 44.0, 41.0, 43.0, 38.0, 41.0, 37.0, 37.0, 31.0, 26.0, 25.0, 25.0, 24.0, 14.0, 23.0, 23.0, 22.0, 7.0, 7.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.892425537109375, -2.79852294921875, -2.704620361328125, -2.6107177734375, -2.516815185546875, -2.42291259765625, -2.329010009765625, -2.235107421875, -2.141204833984375, -2.04730224609375, -1.953399658203125, -1.8594970703125, -1.765594482421875, -1.67169189453125, -1.577789306640625, -1.48388671875, -1.389984130859375, -1.29608154296875, -1.202178955078125, -1.1082763671875, -1.014373779296875, -0.92047119140625, -0.826568603515625, -0.732666015625, -0.638763427734375, -0.54486083984375, -0.450958251953125, -0.3570556640625, -0.263153076171875, -0.16925048828125, -0.075347900390625, 0.0185546875, 0.112457275390625, 0.20635986328125, 0.300262451171875, 0.3941650390625, 0.488067626953125, 0.58197021484375, 0.675872802734375, 0.769775390625, 0.863677978515625, 0.95758056640625, 1.051483154296875, 1.1453857421875, 1.239288330078125, 1.33319091796875, 1.427093505859375, 1.52099609375, 1.614898681640625, 1.70880126953125, 1.802703857421875, 1.8966064453125, 1.990509033203125, 2.08441162109375, 2.178314208984375, 2.272216796875, 2.366119384765625, 2.46002197265625, 2.553924560546875, 2.6478271484375, 2.741729736328125, 2.83563232421875, 2.929534912109375, 3.0234375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 10.0, 28.0, 31.0, 45.0, 49.0, 88.0, 128.0, 161.0, 226.0, 340.0, 486.0, 693.0, 983.0, 1409.0, 2027.0, 3035.0, 4470.0, 6369.0, 9326.0, 13735.0, 20403.0, 30290.0, 47389.0, 77297.0, 140666.0, 259590.0, 175258.0, 92252.0, 54743.0, 34735.0, 23021.0, 15595.0, 10592.0, 7172.0, 4969.0, 3331.0, 2298.0, 1608.0, 1151.0, 757.0, 549.0, 385.0, 247.0, 166.0, 141.0, 94.0, 56.0, 52.0, 31.0, 26.0, 16.0, 10.0, 8.0, 8.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.485595703125, -0.4702568054199219, -0.45491790771484375, -0.4395790100097656, -0.4242401123046875, -0.4089012145996094, -0.39356231689453125, -0.3782234191894531, -0.362884521484375, -0.3475456237792969, -0.33220672607421875, -0.3168678283691406, -0.3015289306640625, -0.2861900329589844, -0.27085113525390625, -0.2555122375488281, -0.24017333984375, -0.22483444213867188, -0.20949554443359375, -0.19415664672851562, -0.1788177490234375, -0.16347885131835938, -0.14813995361328125, -0.13280105590820312, -0.117462158203125, -0.10212326049804688, -0.08678436279296875, -0.07144546508789062, -0.0561065673828125, -0.040767669677734375, -0.02542877197265625, -0.010089874267578125, 0.0052490234375, 0.020587921142578125, 0.03592681884765625, 0.051265716552734375, 0.0666046142578125, 0.08194351196289062, 0.09728240966796875, 0.11262130737304688, 0.127960205078125, 0.14329910278320312, 0.15863800048828125, 0.17397689819335938, 0.1893157958984375, 0.20465469360351562, 0.21999359130859375, 0.23533248901367188, 0.25067138671875, 0.2660102844238281, 0.28134918212890625, 0.2966880798339844, 0.3120269775390625, 0.3273658752441406, 0.34270477294921875, 0.3580436706542969, 0.373382568359375, 0.3887214660644531, 0.40406036376953125, 0.4193992614746094, 0.4347381591796875, 0.4500770568847656, 0.46541595458984375, 0.4807548522949219, 0.49609375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 1.0, 7.0, 4.0, 4.0, 9.0, 7.0, 12.0, 20.0, 11.0, 19.0, 18.0, 12.0, 20.0, 23.0, 15.0, 26.0, 41.0, 37.0, 36.0, 37.0, 42.0, 33.0, 40.0, 1064.0, 38.0, 51.0, 33.0, 39.0, 38.0, 34.0, 30.0, 28.0, 37.0, 24.0, 33.0, 20.0, 20.0, 9.0, 7.0, 10.0, 9.0, 2.0, 8.0, 12.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6103515625, -1.5503692626953125, -1.490386962890625, -1.4304046630859375, -1.37042236328125, -1.3104400634765625, -1.250457763671875, -1.1904754638671875, -1.1304931640625, -1.0705108642578125, -1.010528564453125, -0.9505462646484375, -0.89056396484375, -0.8305816650390625, -0.770599365234375, -0.7106170654296875, -0.650634765625, -0.5906524658203125, -0.530670166015625, -0.4706878662109375, -0.41070556640625, -0.3507232666015625, -0.290740966796875, -0.2307586669921875, -0.1707763671875, -0.1107940673828125, -0.050811767578125, 0.0091705322265625, 0.06915283203125, 0.1291351318359375, 0.189117431640625, 0.2490997314453125, 0.30908203125, 0.3690643310546875, 0.429046630859375, 0.4890289306640625, 0.54901123046875, 0.6089935302734375, 0.668975830078125, 0.7289581298828125, 0.7889404296875, 0.8489227294921875, 0.908905029296875, 0.9688873291015625, 1.02886962890625, 1.0888519287109375, 1.148834228515625, 1.2088165283203125, 1.268798828125, 1.3287811279296875, 1.388763427734375, 1.4487457275390625, 1.50872802734375, 1.5687103271484375, 1.628692626953125, 1.6886749267578125, 1.7486572265625, 1.8086395263671875, 1.868621826171875, 1.9286041259765625, 1.98858642578125, 2.0485687255859375, 2.108551025390625, 2.1685333251953125, 2.228515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 10.0, 9.0, 8.0, 20.0, 21.0, 40.0, 64.0, 115.0, 148.0, 221.0, 394.0, 571.0, 866.0, 1230.0, 1871.0, 2716.0, 4013.0, 6053.0, 9267.0, 14453.0, 23339.0, 37949.0, 65605.0, 124167.0, 1323091.0, 225649.0, 105287.0, 56947.0, 33597.0, 20668.0, 13314.0, 8584.0, 5668.0, 3869.0, 2463.0, 1683.0, 1094.0, 737.0, 458.0, 287.0, 209.0, 122.0, 93.0, 57.0, 41.0, 17.0, 14.0, 17.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.49267578125, -0.475616455078125, -0.45855712890625, -0.441497802734375, -0.4244384765625, -0.407379150390625, -0.39031982421875, -0.373260498046875, -0.356201171875, -0.339141845703125, -0.32208251953125, -0.305023193359375, -0.2879638671875, -0.270904541015625, -0.25384521484375, -0.236785888671875, -0.2197265625, -0.202667236328125, -0.18560791015625, -0.168548583984375, -0.1514892578125, -0.134429931640625, -0.11737060546875, -0.100311279296875, -0.083251953125, -0.066192626953125, -0.04913330078125, -0.032073974609375, -0.0150146484375, 0.002044677734375, 0.01910400390625, 0.036163330078125, 0.05322265625, 0.070281982421875, 0.08734130859375, 0.104400634765625, 0.1214599609375, 0.138519287109375, 0.15557861328125, 0.172637939453125, 0.189697265625, 0.206756591796875, 0.22381591796875, 0.240875244140625, 0.2579345703125, 0.274993896484375, 0.29205322265625, 0.309112548828125, 0.326171875, 0.343231201171875, 0.36029052734375, 0.377349853515625, 0.3944091796875, 0.411468505859375, 0.42852783203125, 0.445587158203125, 0.462646484375, 0.479705810546875, 0.49676513671875, 0.513824462890625, 0.5308837890625, 0.547943115234375, 0.56500244140625, 0.582061767578125, 0.59912109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 10.0, 8.0, 17.0, 21.0, 22.0, 17.0, 32.0, 37.0, 37.0, 34.0, 45.0, 48.0, 55.0, 50.0, 57.0, 46.0, 57.0, 55.0, 41.0, 38.0, 46.0, 31.0, 31.0, 39.0, 19.0, 13.0, 16.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000232696533203125, -0.0002246946096420288, -0.00021669268608093262, -0.00020869076251983643, -0.00020068883895874023, -0.00019268691539764404, -0.00018468499183654785, -0.00017668306827545166, -0.00016868114471435547, -0.00016067922115325928, -0.00015267729759216309, -0.0001446753740310669, -0.0001366734504699707, -0.0001286715269088745, -0.00012066960334777832, -0.00011266767978668213, -0.00010466575622558594, -9.666383266448975e-05, -8.866190910339355e-05, -8.065998554229736e-05, -7.265806198120117e-05, -6.465613842010498e-05, -5.665421485900879e-05, -4.86522912979126e-05, -4.0650367736816406e-05, -3.2648444175720215e-05, -2.4646520614624023e-05, -1.6644597053527832e-05, -8.64267349243164e-06, -6.407499313354492e-07, 7.361173629760742e-06, 1.5363097190856934e-05, 2.3365020751953125e-05, 3.1366944313049316e-05, 3.936886787414551e-05, 4.73707914352417e-05, 5.537271499633789e-05, 6.337463855743408e-05, 7.137656211853027e-05, 7.937848567962646e-05, 8.738040924072266e-05, 9.538233280181885e-05, 0.00010338425636291504, 0.00011138617992401123, 0.00011938810348510742, 0.0001273900270462036, 0.0001353919506072998, 0.000143393874168396, 0.0001513957977294922, 0.00015939772129058838, 0.00016739964485168457, 0.00017540156841278076, 0.00018340349197387695, 0.00019140541553497314, 0.00019940733909606934, 0.00020740926265716553, 0.00021541118621826172, 0.0002234131097793579, 0.0002314150333404541, 0.0002394169569015503, 0.0002474188804626465, 0.0002554208040237427, 0.00026342272758483887, 0.00027142465114593506, 0.00027942657470703125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 15.0, 19.0, 23.0, 25.0, 45.0, 51.0, 59.0, 76.0, 92.0, 125.0, 254.0, 513.0, 1477.0, 415731.0, 626699.0, 1806.0, 572.0, 271.0, 173.0, 110.0, 77.0, 61.0, 45.0, 51.0, 30.0, 29.0, 27.0, 14.0, 13.0, 9.0, 6.0, 11.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.006122589111328125, -0.005952715873718262, -0.0057828426361083984, -0.005612969398498535, -0.005443096160888672, -0.005273222923278809, -0.005103349685668945, -0.004933476448059082, -0.004763603210449219, -0.0045937299728393555, -0.004423856735229492, -0.004253983497619629, -0.004084110260009766, -0.003914237022399902, -0.003744363784790039, -0.0035744905471801758, -0.0034046173095703125, -0.0032347440719604492, -0.003064870834350586, -0.0028949975967407227, -0.0027251243591308594, -0.002555251121520996, -0.002385377883911133, -0.0022155046463012695, -0.0020456314086914062, -0.001875758171081543, -0.0017058849334716797, -0.0015360116958618164, -0.0013661384582519531, -0.0011962652206420898, -0.0010263919830322266, -0.0008565187454223633, -0.0006866455078125, -0.0005167722702026367, -0.00034689903259277344, -0.00017702579498291016, -7.152557373046875e-06, 0.0001627206802368164, 0.0003325939178466797, 0.000502467155456543, 0.0006723403930664062, 0.0008422136306762695, 0.0010120868682861328, 0.001181960105895996, 0.0013518333435058594, 0.0015217065811157227, 0.001691579818725586, 0.0018614530563354492, 0.0020313262939453125, 0.0022011995315551758, 0.002371072769165039, 0.0025409460067749023, 0.0027108192443847656, 0.002880692481994629, 0.003050565719604492, 0.0032204389572143555, 0.0033903121948242188, 0.003560185432434082, 0.0037300586700439453, 0.0038999319076538086, 0.004069805145263672, 0.004239678382873535, 0.0044095516204833984, 0.004579424858093262, 0.004749298095703125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 19.0, 28.0, 34.0, 76.0, 120.0, 126.0, 130.0, 133.0, 127.0, 81.0, 49.0, 41.0, 14.0, 13.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00014169173664413393, -0.00013415678404271603, -0.00012662183144129813, -0.00011908687883988023, -0.00011155191896250471, -0.00010401696636108682, -9.648201375966892e-05, -8.89470538822934e-05, -8.14121012808755e-05, -7.38771486794576e-05, -6.63421960780397e-05, -5.8807239838643e-05, -5.127228359924629e-05, -4.3737330997828394e-05, -3.6202378396410495e-05, -2.866742215701379e-05, -2.1132473193574697e-05, -1.3597518773167394e-05, -6.062565262254793e-06, 1.4723882486578077e-06, 9.00734266906511e-06, 1.6542297089472413e-05, 2.4077249690890312e-05, 3.161220593028702e-05, 3.914715853170492e-05, 4.668211113312282e-05, 5.421706737251952e-05, 6.175201997393742e-05, 6.928697257535532e-05, 7.682193245273083e-05, 8.435688505414873e-05, 9.189183765556663e-05, 9.942679025698453e-05, 0.00010696174285840243, 0.00011449669545982033, 0.00012203164806123823, 0.00012956660066265613, 0.00013710156781598926, 0.00014463652041740716, 0.00015217147301882505, 0.00015970642562024295, 0.00016724137822166085, 0.00017477633082307875, 0.00018231128342449665, 0.00018984623602591455, 0.00019738118862733245, 0.00020491614122875035, 0.00021245110838208348, 0.00021998604643158615, 0.00022752099903300405, 0.00023505595163442194, 0.00024259090423583984, 0.00025012585683725774, 0.00025766080943867564, 0.00026519576204009354, 0.00027273071464151144, 0.0002802656963467598, 0.0002878006489481777, 0.0002953356015495956, 0.0003028705541510135, 0.0003104055067524314, 0.0003179404593538493, 0.0003254754119552672, 0.0003330103645566851, 0.000340545317158103]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 7.0, 4.0, 2.0, 5.0, 11.0, 15.0, 11.0, 19.0, 10.0, 24.0, 31.0, 47.0, 23.0, 30.0, 33.0, 40.0, 39.0, 39.0, 39.0, 42.0, 38.0, 42.0, 37.0, 39.0, 41.0, 33.0, 35.0, 30.0, 28.0, 33.0, 29.0, 16.0, 19.0, 23.0, 19.0, 13.0, 14.0, 8.0, 5.0, 10.0, 2.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00014823675155639648, -0.0001438213512301445, -0.00013940595090389252, -0.00013499055057764053, -0.00013057515025138855, -0.00012615974992513657, -0.00012174434959888458, -0.0001173289492726326, -0.00011291354894638062, -0.00010849814862012863, -0.00010408274829387665, -9.966734796762466e-05, -9.525194764137268e-05, -9.08365473151207e-05, -8.642114698886871e-05, -8.200574666261673e-05, -7.759034633636475e-05, -7.317494601011276e-05, -6.875954568386078e-05, -6.43441453576088e-05, -5.992874503135681e-05, -5.551334470510483e-05, -5.1097944378852844e-05, -4.668254405260086e-05, -4.226714372634888e-05, -3.785174340009689e-05, -3.343634307384491e-05, -2.9020942747592926e-05, -2.4605542421340942e-05, -2.019014209508896e-05, -1.5774741768836975e-05, -1.1359341442584991e-05, -6.943941116333008e-06, -2.528540790081024e-06, 1.8868595361709595e-06, 6.302259862422943e-06, 1.0717660188674927e-05, 1.513306051492691e-05, 1.9548460841178894e-05, 2.3963861167430878e-05, 2.837926149368286e-05, 3.2794661819934845e-05, 3.721006214618683e-05, 4.162546247243881e-05, 4.6040862798690796e-05, 5.045626312494278e-05, 5.487166345119476e-05, 5.928706377744675e-05, 6.370246410369873e-05, 6.811786442995071e-05, 7.25332647562027e-05, 7.694866508245468e-05, 8.136406540870667e-05, 8.577946573495865e-05, 9.019486606121063e-05, 9.461026638746262e-05, 9.90256667137146e-05, 0.00010344106703996658, 0.00010785646736621857, 0.00011227186769247055, 0.00011668726801872253, 0.00012110266834497452, 0.0001255180686712265, 0.00012993346899747849, 0.00013434886932373047]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 11.0, 11.0, 16.0, 20.0, 26.0, 21.0, 22.0, 26.0, 22.0, 35.0, 29.0, 31.0, 33.0, 43.0, 32.0, 47.0, 44.0, 41.0, 43.0, 38.0, 41.0, 37.0, 37.0, 31.0, 26.0, 25.0, 25.0, 24.0, 14.0, 23.0, 23.0, 22.0, 7.0, 7.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.892425537109375, -2.79852294921875, -2.704620361328125, -2.6107177734375, -2.516815185546875, -2.42291259765625, -2.329010009765625, -2.235107421875, -2.141204833984375, -2.04730224609375, -1.953399658203125, -1.8594970703125, -1.765594482421875, -1.67169189453125, -1.577789306640625, -1.48388671875, -1.389984130859375, -1.29608154296875, -1.202178955078125, -1.1082763671875, -1.014373779296875, -0.92047119140625, -0.826568603515625, -0.732666015625, -0.638763427734375, -0.54486083984375, -0.450958251953125, -0.3570556640625, -0.263153076171875, -0.16925048828125, -0.075347900390625, 0.0185546875, 0.112457275390625, 0.20635986328125, 0.300262451171875, 0.3941650390625, 0.488067626953125, 0.58197021484375, 0.675872802734375, 0.769775390625, 0.863677978515625, 0.95758056640625, 1.051483154296875, 1.1453857421875, 1.239288330078125, 1.33319091796875, 1.427093505859375, 1.52099609375, 1.614898681640625, 1.70880126953125, 1.802703857421875, 1.8966064453125, 1.990509033203125, 2.08441162109375, 2.178314208984375, 2.272216796875, 2.366119384765625, 2.46002197265625, 2.553924560546875, 2.6478271484375, 2.741729736328125, 2.83563232421875, 2.929534912109375, 3.0234375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 20.0, 23.0, 37.0, 56.0, 69.0, 112.0, 242.0, 452.0, 1027.0, 2129.0, 4464.0, 9401.0, 19415.0, 43619.0, 110736.0, 291262.0, 336562.0, 133614.0, 52083.0, 22587.0, 10619.0, 5173.0, 2425.0, 1115.0, 566.0, 280.0, 137.0, 81.0, 49.0, 38.0, 34.0, 26.0, 14.0, 11.0, 7.0, 6.0, 7.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.821014404296875, -2.72406005859375, -2.627105712890625, -2.5301513671875, -2.433197021484375, -2.33624267578125, -2.239288330078125, -2.142333984375, -2.045379638671875, -1.94842529296875, -1.851470947265625, -1.7545166015625, -1.657562255859375, -1.56060791015625, -1.463653564453125, -1.36669921875, -1.269744873046875, -1.17279052734375, -1.075836181640625, -0.9788818359375, -0.881927490234375, -0.78497314453125, -0.688018798828125, -0.591064453125, -0.494110107421875, -0.39715576171875, -0.300201416015625, -0.2032470703125, -0.106292724609375, -0.00933837890625, 0.087615966796875, 0.1845703125, 0.281524658203125, 0.37847900390625, 0.475433349609375, 0.5723876953125, 0.669342041015625, 0.76629638671875, 0.863250732421875, 0.960205078125, 1.057159423828125, 1.15411376953125, 1.251068115234375, 1.3480224609375, 1.444976806640625, 1.54193115234375, 1.638885498046875, 1.73583984375, 1.832794189453125, 1.92974853515625, 2.026702880859375, 2.1236572265625, 2.220611572265625, 2.31756591796875, 2.414520263671875, 2.511474609375, 2.608428955078125, 2.70538330078125, 2.802337646484375, 2.8992919921875, 2.996246337890625, 3.09320068359375, 3.190155029296875, 3.287109375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 9.0, 9.0, 12.0, 13.0, 13.0, 19.0, 33.0, 23.0, 35.0, 27.0, 34.0, 49.0, 51.0, 71.0, 150.0, 452.0, 1468.0, 146.0, 73.0, 52.0, 53.0, 42.0, 35.0, 29.0, 23.0, 16.0, 14.0, 23.0, 16.0, 10.0, 9.0, 3.0, 5.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -13.02001953125, -12.5712890625, -12.12255859375, -11.673828125, -11.22509765625, -10.7763671875, -10.32763671875, -9.87890625, -9.43017578125, -8.9814453125, -8.53271484375, -8.083984375, -7.63525390625, -7.1865234375, -6.73779296875, -6.2890625, -5.84033203125, -5.3916015625, -4.94287109375, -4.494140625, -4.04541015625, -3.5966796875, -3.14794921875, -2.69921875, -2.25048828125, -1.8017578125, -1.35302734375, -0.904296875, -0.45556640625, -0.0068359375, 0.44189453125, 0.890625, 1.33935546875, 1.7880859375, 2.23681640625, 2.685546875, 3.13427734375, 3.5830078125, 4.03173828125, 4.48046875, 4.92919921875, 5.3779296875, 5.82666015625, 6.275390625, 6.72412109375, 7.1728515625, 7.62158203125, 8.0703125, 8.51904296875, 8.9677734375, 9.41650390625, 9.865234375, 10.31396484375, 10.7626953125, 11.21142578125, 11.66015625, 12.10888671875, 12.5576171875, 13.00634765625, 13.455078125, 13.90380859375, 14.3525390625, 14.80126953125, 15.25]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 10.0, 7.0, 18.0, 16.0, 20.0, 26.0, 24.0, 40.0, 40.0, 40.0, 93.0, 127.0, 187.0, 325.0, 580.0, 2871.0, 3029789.0, 109090.0, 1086.0, 432.0, 261.0, 156.0, 120.0, 89.0, 56.0, 39.0, 34.0, 20.0, 28.0, 24.0, 11.0, 16.0, 9.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.90625, -37.6826171875, -36.458984375, -35.2353515625, -34.01171875, -32.7880859375, -31.564453125, -30.3408203125, -29.1171875, -27.8935546875, -26.669921875, -25.4462890625, -24.22265625, -22.9990234375, -21.775390625, -20.5517578125, -19.328125, -18.1044921875, -16.880859375, -15.6572265625, -14.43359375, -13.2099609375, -11.986328125, -10.7626953125, -9.5390625, -8.3154296875, -7.091796875, -5.8681640625, -4.64453125, -3.4208984375, -2.197265625, -0.9736328125, 0.25, 1.4736328125, 2.697265625, 3.9208984375, 5.14453125, 6.3681640625, 7.591796875, 8.8154296875, 10.0390625, 11.2626953125, 12.486328125, 13.7099609375, 14.93359375, 16.1572265625, 17.380859375, 18.6044921875, 19.828125, 21.0517578125, 22.275390625, 23.4990234375, 24.72265625, 25.9462890625, 27.169921875, 28.3935546875, 29.6171875, 30.8408203125, 32.064453125, 33.2880859375, 34.51171875, 35.7353515625, 36.958984375, 38.1826171875, 39.40625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 22.0, 148.0, 372.0, 331.0, 109.0, 20.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.757884979248047, -26.49295425415039, -25.228025436401367, -23.96309471130371, -22.698165893554688, -21.43323516845703, -20.168304443359375, -18.90337371826172, -17.638444900512695, -16.37351417541504, -15.108585357666016, -13.84365463256836, -12.57872486114502, -11.31379508972168, -10.048864364624023, -8.783934593200684, -7.519004821777344, -6.254075050354004, -4.989144802093506, -3.724214792251587, -2.459284782409668, -1.1943550109863281, 0.07057523727416992, 1.335505485534668, 2.600435256958008, 3.8653652667999268, 5.130295276641846, 6.395225524902344, 7.660155296325684, 8.925085067749023, 10.19001579284668, 11.45494556427002, 12.719871520996094, 13.984801292419434, 15.249731063842773, 16.51466178894043, 17.779590606689453, 19.04452133178711, 20.309452056884766, 21.574382781982422, 22.839311599731445, 24.1042423248291, 25.369171142578125, 26.63410186767578, 27.899032592773438, 29.16396141052246, 30.428892135620117, 31.69382095336914, 32.9587516784668, 34.22368240356445, 35.48861312866211, 36.7535400390625, 38.018470764160156, 39.28340148925781, 40.54833221435547, 41.813262939453125, 43.07819366455078, 44.34312438964844, 45.608055114746094, 46.872982025146484, 48.13791275024414, 49.4028434753418, 50.66777420043945, 51.93270492553711, 53.1976318359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 5.0, 6.0, 10.0, 10.0, 8.0, 17.0, 21.0, 17.0, 23.0, 25.0, 18.0, 22.0, 26.0, 40.0, 39.0, 32.0, 33.0, 36.0, 51.0, 24.0, 34.0, 50.0, 43.0, 39.0, 35.0, 42.0, 46.0, 34.0, 24.0, 27.0, 15.0, 26.0, 18.0, 16.0, 17.0, 5.0, 11.0, 16.0, 5.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.774852752685547, -27.903209686279297, -27.031564712524414, -26.159921646118164, -25.28827667236328, -24.41663360595703, -23.54499053955078, -22.67334747314453, -21.80170249938965, -20.9300594329834, -20.058414459228516, -19.186771392822266, -18.315128326416016, -17.443483352661133, -16.571840286254883, -15.700196266174316, -14.82855224609375, -13.956908226013184, -13.085264205932617, -12.213621139526367, -11.3419771194458, -10.470333099365234, -9.598690032958984, -8.727046012878418, -7.855401992797852, -6.983757972717285, -6.112114429473877, -5.240470886230469, -4.368826866149902, -3.497182846069336, -2.6255393028259277, -1.7538957595825195, -0.8822498321533203, -0.010606050491333008, 0.8610377311706543, 1.7326815128326416, 2.604325294494629, 3.4759693145751953, 4.3476128578186035, 5.219256401062012, 6.090900421142578, 6.9625444412231445, 7.834187984466553, 8.705831527709961, 9.577475547790527, 10.449119567871094, 11.320762634277344, 12.19240665435791, 13.064050674438477, 13.935694694519043, 14.80733871459961, 15.67898178100586, 16.55062484741211, 17.422269821166992, 18.293912887573242, 19.165557861328125, 20.037200927734375, 20.908843994140625, 21.780488967895508, 22.652132034301758, 23.52377700805664, 24.39542007446289, 25.26706314086914, 26.13870620727539, 27.010351181030273]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 11.0, 10.0, 17.0, 20.0, 25.0, 22.0, 25.0, 28.0, 32.0, 27.0, 40.0, 35.0, 42.0, 41.0, 37.0, 34.0, 47.0, 40.0, 38.0, 41.0, 51.0, 34.0, 32.0, 29.0, 42.0, 24.0, 21.0, 17.0, 20.0, 22.0, 13.0, 9.0, 9.0, 14.0, 1.0, 6.0, 6.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.33453369140625, -3.2237548828125, -3.11297607421875, -3.002197265625, -2.89141845703125, -2.7806396484375, -2.66986083984375, -2.55908203125, -2.44830322265625, -2.3375244140625, -2.22674560546875, -2.115966796875, -2.00518798828125, -1.8944091796875, -1.78363037109375, -1.6728515625, -1.56207275390625, -1.4512939453125, -1.34051513671875, -1.229736328125, -1.11895751953125, -1.0081787109375, -0.89739990234375, -0.78662109375, -0.67584228515625, -0.5650634765625, -0.45428466796875, -0.343505859375, -0.23272705078125, -0.1219482421875, -0.01116943359375, 0.099609375, 0.21038818359375, 0.3211669921875, 0.43194580078125, 0.542724609375, 0.65350341796875, 0.7642822265625, 0.87506103515625, 0.98583984375, 1.09661865234375, 1.2073974609375, 1.31817626953125, 1.428955078125, 1.53973388671875, 1.6505126953125, 1.76129150390625, 1.8720703125, 1.98284912109375, 2.0936279296875, 2.20440673828125, 2.315185546875, 2.42596435546875, 2.5367431640625, 2.64752197265625, 2.75830078125, 2.86907958984375, 2.9798583984375, 3.09063720703125, 3.201416015625, 3.31219482421875, 3.4229736328125, 3.53375244140625, 3.64453125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 5.0, 5.0, 9.0, 9.0, 18.0, 27.0, 25.0, 32.0, 34.0, 44.0, 64.0, 87.0, 102.0, 173.0, 315.0, 880.0, 4307.0, 141100.0, 2864240.0, 1155364.0, 24208.0, 1920.0, 498.0, 240.0, 142.0, 97.0, 63.0, 50.0, 48.0, 27.0, 36.0, 23.0, 22.0, 14.0, 13.0, 7.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.8680419921875, -9.525146484375, -9.1822509765625, -8.83935546875, -8.4964599609375, -8.153564453125, -7.8106689453125, -7.4677734375, -7.1248779296875, -6.781982421875, -6.4390869140625, -6.09619140625, -5.7532958984375, -5.410400390625, -5.0675048828125, -4.724609375, -4.3817138671875, -4.038818359375, -3.6959228515625, -3.35302734375, -3.0101318359375, -2.667236328125, -2.3243408203125, -1.9814453125, -1.6385498046875, -1.295654296875, -0.9527587890625, -0.60986328125, -0.2669677734375, 0.075927734375, 0.4188232421875, 0.76171875, 1.1046142578125, 1.447509765625, 1.7904052734375, 2.13330078125, 2.4761962890625, 2.819091796875, 3.1619873046875, 3.5048828125, 3.8477783203125, 4.190673828125, 4.5335693359375, 4.87646484375, 5.2193603515625, 5.562255859375, 5.9051513671875, 6.248046875, 6.5909423828125, 6.933837890625, 7.2767333984375, 7.61962890625, 7.9625244140625, 8.305419921875, 8.6483154296875, 8.9912109375, 9.3341064453125, 9.677001953125, 10.0198974609375, 10.36279296875, 10.7056884765625, 11.048583984375, 11.3914794921875, 11.734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 19.0, 15.0, 27.0, 34.0, 58.0, 82.0, 98.0, 180.0, 241.0, 323.0, 441.0, 500.0, 468.0, 431.0, 318.0, 225.0, 169.0, 120.0, 99.0, 42.0, 43.0, 32.0, 20.0, 18.0, 18.0, 7.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.10601806640625, -5.8800048828125, -5.65399169921875, -5.427978515625, -5.20196533203125, -4.9759521484375, -4.74993896484375, -4.52392578125, -4.29791259765625, -4.0718994140625, -3.84588623046875, -3.619873046875, -3.39385986328125, -3.1678466796875, -2.94183349609375, -2.7158203125, -2.48980712890625, -2.2637939453125, -2.03778076171875, -1.811767578125, -1.58575439453125, -1.3597412109375, -1.13372802734375, -0.90771484375, -0.68170166015625, -0.4556884765625, -0.22967529296875, -0.003662109375, 0.22235107421875, 0.4483642578125, 0.67437744140625, 0.900390625, 1.12640380859375, 1.3524169921875, 1.57843017578125, 1.804443359375, 2.03045654296875, 2.2564697265625, 2.48248291015625, 2.70849609375, 2.93450927734375, 3.1605224609375, 3.38653564453125, 3.612548828125, 3.83856201171875, 4.0645751953125, 4.29058837890625, 4.5166015625, 4.74261474609375, 4.9686279296875, 5.19464111328125, 5.420654296875, 5.64666748046875, 5.8726806640625, 6.09869384765625, 6.32470703125, 6.55072021484375, 6.7767333984375, 7.00274658203125, 7.228759765625, 7.45477294921875, 7.6807861328125, 7.90679931640625, 8.1328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 10.0, 15.0, 21.0, 32.0, 45.0, 56.0, 61.0, 144.0, 184.0, 257.0, 390.0, 725.0, 14677.0, 4105486.0, 69929.0, 907.0, 456.0, 271.0, 203.0, 124.0, 84.0, 61.0, 41.0, 15.0, 20.0, 17.0, 13.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.65625, -37.628173828125, -36.60009765625, -35.572021484375, -34.5439453125, -33.515869140625, -32.48779296875, -31.459716796875, -30.431640625, -29.403564453125, -28.37548828125, -27.347412109375, -26.3193359375, -25.291259765625, -24.26318359375, -23.235107421875, -22.20703125, -21.178955078125, -20.15087890625, -19.122802734375, -18.0947265625, -17.066650390625, -16.03857421875, -15.010498046875, -13.982421875, -12.954345703125, -11.92626953125, -10.898193359375, -9.8701171875, -8.842041015625, -7.81396484375, -6.785888671875, -5.7578125, -4.729736328125, -3.70166015625, -2.673583984375, -1.6455078125, -0.617431640625, 0.41064453125, 1.438720703125, 2.466796875, 3.494873046875, 4.52294921875, 5.551025390625, 6.5791015625, 7.607177734375, 8.63525390625, 9.663330078125, 10.69140625, 11.719482421875, 12.74755859375, 13.775634765625, 14.8037109375, 15.831787109375, 16.85986328125, 17.887939453125, 18.916015625, 19.944091796875, 20.97216796875, 22.000244140625, 23.0283203125, 24.056396484375, 25.08447265625, 26.112548828125, 27.140625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 91.0, 430.0, 411.0, 69.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.77948760986328, -23.382638931274414, -19.985790252685547, -16.58894157409668, -13.192092895507812, -9.795244216918945, -6.398395538330078, -3.001546859741211, 0.39530181884765625, 3.7921504974365234, 7.188999176025391, 10.585847854614258, 13.982696533203125, 17.379545211791992, 20.77639389038086, 24.173242568969727, 27.570091247558594, 30.96693992614746, 34.36378860473633, 37.76063537597656, 41.15748596191406, 44.55433654785156, 47.9511833190918, 51.34803009033203, 54.74488067626953, 58.14173126220703, 61.538578033447266, 64.9354248046875, 68.332275390625, 71.7291259765625, 75.1259765625, 78.52281951904297, 81.919677734375, 85.3165283203125, 88.71337890625, 92.11022186279297, 95.50707244873047, 98.90392303466797, 102.30076599121094, 105.69761657714844, 109.09446716308594, 112.49131774902344, 115.88816833496094, 119.2850112915039, 122.6818618774414, 126.0787124633789, 129.47555541992188, 132.87240600585938, 136.26925659179688, 139.66610717773438, 143.06295776367188, 146.45980834960938, 149.85665893554688, 153.2534942626953, 156.6503448486328, 160.0471954345703, 163.4440460205078, 166.8408966064453, 170.2377471923828, 173.6345977783203, 177.03143310546875, 180.42828369140625, 183.82513427734375, 187.22198486328125, 190.61883544921875]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 5.0, 11.0, 10.0, 7.0, 6.0, 13.0, 16.0, 11.0, 29.0, 19.0, 29.0, 40.0, 41.0, 31.0, 36.0, 43.0, 36.0, 51.0, 47.0, 49.0, 49.0, 36.0, 47.0, 49.0, 43.0, 28.0, 32.0, 41.0, 21.0, 26.0, 13.0, 18.0, 15.0, 10.0, 9.0, 11.0, 6.0, 0.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.824111938476562, -21.110454559326172, -20.39679527282715, -19.683137893676758, -18.969478607177734, -18.255821228027344, -17.542163848876953, -16.82850456237793, -16.114845275878906, -15.4011869430542, -14.687528610229492, -13.973871231079102, -13.260211944580078, -12.546554565429688, -11.83289623260498, -11.119237899780273, -10.405580520629883, -9.691922187805176, -8.978263854980469, -8.264606475830078, -7.550947666168213, -6.837289333343506, -6.123631477355957, -5.40997314453125, -4.696314811706543, -3.982656478881836, -3.268998384475708, -2.55534029006958, -1.841681957244873, -1.128023624420166, -0.4143657684326172, 0.29929256439208984, 1.0129528045654297, 1.7266110181808472, 2.4402692317962646, 3.1539273262023926, 3.8675856590270996, 4.581243991851807, 5.2949018478393555, 6.0085601806640625, 6.7222185134887695, 7.435876846313477, 8.149535179138184, 8.86319351196289, 9.576850891113281, 10.290510177612305, 11.004167556762695, 11.717825889587402, 12.43148422241211, 13.145142555236816, 13.858800888061523, 14.572458267211914, 15.286117553710938, 15.999774932861328, 16.71343231201172, 17.427091598510742, 18.140750885009766, 18.854408264160156, 19.56806755065918, 20.28172492980957, 20.995384216308594, 21.709041595458984, 22.422698974609375, 23.1363582611084, 23.85001564025879]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 12.0, 7.0, 11.0, 9.0, 13.0, 15.0, 19.0, 20.0, 25.0, 23.0, 32.0, 28.0, 24.0, 39.0, 39.0, 36.0, 32.0, 48.0, 40.0, 30.0, 45.0, 38.0, 29.0, 33.0, 30.0, 35.0, 26.0, 31.0, 32.0, 35.0, 24.0, 23.0, 14.0, 14.0, 11.0, 14.0, 5.0, 9.0, 8.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-3.298828125, -3.205657958984375, -3.11248779296875, -3.019317626953125, -2.9261474609375, -2.832977294921875, -2.73980712890625, -2.646636962890625, -2.553466796875, -2.460296630859375, -2.36712646484375, -2.273956298828125, -2.1807861328125, -2.087615966796875, -1.99444580078125, -1.901275634765625, -1.80810546875, -1.714935302734375, -1.62176513671875, -1.528594970703125, -1.4354248046875, -1.342254638671875, -1.24908447265625, -1.155914306640625, -1.062744140625, -0.969573974609375, -0.87640380859375, -0.783233642578125, -0.6900634765625, -0.596893310546875, -0.50372314453125, -0.410552978515625, -0.3173828125, -0.224212646484375, -0.13104248046875, -0.037872314453125, 0.0552978515625, 0.148468017578125, 0.24163818359375, 0.334808349609375, 0.427978515625, 0.521148681640625, 0.61431884765625, 0.707489013671875, 0.8006591796875, 0.893829345703125, 0.98699951171875, 1.080169677734375, 1.17333984375, 1.266510009765625, 1.35968017578125, 1.452850341796875, 1.5460205078125, 1.639190673828125, 1.73236083984375, 1.825531005859375, 1.918701171875, 2.011871337890625, 2.10504150390625, 2.198211669921875, 2.2913818359375, 2.384552001953125, 2.47772216796875, 2.570892333984375, 2.6640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 13.0, 19.0, 25.0, 33.0, 36.0, 65.0, 94.0, 157.0, 237.0, 318.0, 490.0, 707.0, 993.0, 1547.0, 2057.0, 2877.0, 4324.0, 6405.0, 9343.0, 13700.0, 20793.0, 32227.0, 50931.0, 84293.0, 154623.0, 264283.0, 160294.0, 87180.0, 51943.0, 33119.0, 21208.0, 13941.0, 9440.0, 6487.0, 4449.0, 3043.0, 2077.0, 1475.0, 991.0, 721.0, 531.0, 339.0, 213.0, 168.0, 122.0, 94.0, 58.0, 26.0, 22.0, 16.0, 7.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.479248046875, -0.4640464782714844, -0.44884490966796875, -0.4336433410644531, -0.4184417724609375, -0.4032402038574219, -0.38803863525390625, -0.3728370666503906, -0.357635498046875, -0.3424339294433594, -0.32723236083984375, -0.3120307922363281, -0.2968292236328125, -0.2816276550292969, -0.26642608642578125, -0.2512245178222656, -0.23602294921875, -0.22082138061523438, -0.20561981201171875, -0.19041824340820312, -0.1752166748046875, -0.16001510620117188, -0.14481353759765625, -0.12961196899414062, -0.114410400390625, -0.09920883178710938, -0.08400726318359375, -0.06880569458007812, -0.0536041259765625, -0.038402557373046875, -0.02320098876953125, -0.007999420166015625, 0.0072021484375, 0.022403717041015625, 0.03760528564453125, 0.052806854248046875, 0.0680084228515625, 0.08320999145507812, 0.09841156005859375, 0.11361312866210938, 0.128814697265625, 0.14401626586914062, 0.15921783447265625, 0.17441940307617188, 0.1896209716796875, 0.20482254028320312, 0.22002410888671875, 0.23522567749023438, 0.25042724609375, 0.2656288146972656, 0.28083038330078125, 0.2960319519042969, 0.3112335205078125, 0.3264350891113281, 0.34163665771484375, 0.3568382263183594, 0.372039794921875, 0.3872413635253906, 0.40244293212890625, 0.4176445007324219, 0.4328460693359375, 0.4480476379394531, 0.46324920654296875, 0.4784507751464844, 0.49365234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 9.0, 5.0, 9.0, 18.0, 9.0, 14.0, 13.0, 21.0, 16.0, 18.0, 24.0, 25.0, 35.0, 22.0, 31.0, 35.0, 34.0, 40.0, 31.0, 32.0, 1059.0, 38.0, 40.0, 36.0, 38.0, 40.0, 33.0, 26.0, 27.0, 28.0, 23.0, 17.0, 29.0, 18.0, 21.0, 15.0, 17.0, 11.0, 7.0, 4.0, 7.0, 11.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.7978515625, -1.74188232421875, -1.6859130859375, -1.62994384765625, -1.573974609375, -1.51800537109375, -1.4620361328125, -1.40606689453125, -1.35009765625, -1.29412841796875, -1.2381591796875, -1.18218994140625, -1.126220703125, -1.07025146484375, -1.0142822265625, -0.95831298828125, -0.90234375, -0.84637451171875, -0.7904052734375, -0.73443603515625, -0.678466796875, -0.62249755859375, -0.5665283203125, -0.51055908203125, -0.45458984375, -0.39862060546875, -0.3426513671875, -0.28668212890625, -0.230712890625, -0.17474365234375, -0.1187744140625, -0.06280517578125, -0.0068359375, 0.04913330078125, 0.1051025390625, 0.16107177734375, 0.217041015625, 0.27301025390625, 0.3289794921875, 0.38494873046875, 0.44091796875, 0.49688720703125, 0.5528564453125, 0.60882568359375, 0.664794921875, 0.72076416015625, 0.7767333984375, 0.83270263671875, 0.888671875, 0.94464111328125, 1.0006103515625, 1.05657958984375, 1.112548828125, 1.16851806640625, 1.2244873046875, 1.28045654296875, 1.33642578125, 1.39239501953125, 1.4483642578125, 1.50433349609375, 1.560302734375, 1.61627197265625, 1.6722412109375, 1.72821044921875, 1.7841796875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 9.0, 14.0, 32.0, 40.0, 69.0, 97.0, 133.0, 195.0, 312.0, 455.0, 614.0, 873.0, 1323.0, 1910.0, 2697.0, 3740.0, 5565.0, 8157.0, 12025.0, 18152.0, 27632.0, 43856.0, 72808.0, 131890.0, 1319190.0, 190860.0, 96179.0, 55855.0, 34280.0, 21985.0, 14690.0, 9678.0, 6725.0, 4602.0, 3167.0, 2222.0, 1574.0, 1082.0, 748.0, 529.0, 387.0, 243.0, 166.0, 117.0, 92.0, 52.0, 38.0, 21.0, 18.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.5166015625, -0.5008277893066406, -0.48505401611328125, -0.4692802429199219, -0.4535064697265625, -0.4377326965332031, -0.42195892333984375, -0.4061851501464844, -0.390411376953125, -0.3746376037597656, -0.35886383056640625, -0.3430900573730469, -0.3273162841796875, -0.3115425109863281, -0.29576873779296875, -0.2799949645996094, -0.26422119140625, -0.24844741821289062, -0.23267364501953125, -0.21689987182617188, -0.2011260986328125, -0.18535232543945312, -0.16957855224609375, -0.15380477905273438, -0.138031005859375, -0.12225723266601562, -0.10648345947265625, -0.09070968627929688, -0.0749359130859375, -0.059162139892578125, -0.04338836669921875, -0.027614593505859375, -0.0118408203125, 0.003932952880859375, 0.01970672607421875, 0.035480499267578125, 0.0512542724609375, 0.06702804565429688, 0.08280181884765625, 0.09857559204101562, 0.114349365234375, 0.13012313842773438, 0.14589691162109375, 0.16167068481445312, 0.1774444580078125, 0.19321823120117188, 0.20899200439453125, 0.22476577758789062, 0.24053955078125, 0.2563133239746094, 0.27208709716796875, 0.2878608703613281, 0.3036346435546875, 0.3194084167480469, 0.33518218994140625, 0.3509559631347656, 0.366729736328125, 0.3825035095214844, 0.39827728271484375, 0.4140510559082031, 0.4298248291015625, 0.4455986022949219, 0.46137237548828125, 0.4771461486816406, 0.492919921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 7.0, 9.0, 9.0, 13.0, 11.0, 15.0, 20.0, 22.0, 22.0, 38.0, 35.0, 43.0, 44.0, 61.0, 57.0, 56.0, 74.0, 61.0, 49.0, 56.0, 38.0, 49.0, 35.0, 23.0, 20.0, 23.0, 14.0, 15.0, 15.0, 5.0, 9.0, 10.0, 6.0, 4.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00033974647521972656, -0.0003298148512840271, -0.00031988322734832764, -0.0003099516034126282, -0.0003000199794769287, -0.00029008835554122925, -0.0002801567316055298, -0.0002702251076698303, -0.00026029348373413086, -0.0002503618597984314, -0.00024043023586273193, -0.00023049861192703247, -0.000220566987991333, -0.00021063536405563354, -0.00020070374011993408, -0.00019077211618423462, -0.00018084049224853516, -0.0001709088683128357, -0.00016097724437713623, -0.00015104562044143677, -0.0001411139965057373, -0.00013118237257003784, -0.00012125074863433838, -0.00011131912469863892, -0.00010138750076293945, -9.145587682723999e-05, -8.152425289154053e-05, -7.159262895584106e-05, -6.16610050201416e-05, -5.172938108444214e-05, -4.1797757148742676e-05, -3.186613321304321e-05, -2.193450927734375e-05, -1.2002885341644287e-05, -2.0712614059448242e-06, 7.860362529754639e-06, 1.77919864654541e-05, 2.7723610401153564e-05, 3.765523433685303e-05, 4.758685827255249e-05, 5.751848220825195e-05, 6.745010614395142e-05, 7.738173007965088e-05, 8.731335401535034e-05, 9.72449779510498e-05, 0.00010717660188674927, 0.00011710822582244873, 0.0001270398497581482, 0.00013697147369384766, 0.00014690309762954712, 0.00015683472156524658, 0.00016676634550094604, 0.0001766979694366455, 0.00018662959337234497, 0.00019656121730804443, 0.0002064928412437439, 0.00021642446517944336, 0.00022635608911514282, 0.00023628771305084229, 0.00024621933698654175, 0.0002561509609222412, 0.0002660825848579407, 0.00027601420879364014, 0.0002859458327293396, 0.00029587745666503906]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 8.0, 6.0, 4.0, 8.0, 9.0, 7.0, 9.0, 17.0, 23.0, 23.0, 27.0, 36.0, 58.0, 54.0, 76.0, 105.0, 194.0, 363.0, 779.0, 7791.0, 1031378.0, 5795.0, 742.0, 366.0, 185.0, 118.0, 76.0, 59.0, 44.0, 36.0, 30.0, 30.0, 20.0, 17.0, 12.0, 11.0, 8.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005908966064453125, -0.00570148229598999, -0.0054939985275268555, -0.005286514759063721, -0.005079030990600586, -0.004871547222137451, -0.004664063453674316, -0.004456579685211182, -0.004249095916748047, -0.004041612148284912, -0.0038341283798217773, -0.0036266446113586426, -0.003419160842895508, -0.003211677074432373, -0.0030041933059692383, -0.0027967095375061035, -0.0025892257690429688, -0.002381742000579834, -0.0021742582321166992, -0.0019667744636535645, -0.0017592906951904297, -0.001551806926727295, -0.0013443231582641602, -0.0011368393898010254, -0.0009293556213378906, -0.0007218718528747559, -0.0005143880844116211, -0.00030690431594848633, -9.942054748535156e-05, 0.0001080632209777832, 0.00031554698944091797, 0.0005230307579040527, 0.0007305145263671875, 0.0009379982948303223, 0.001145482063293457, 0.0013529658317565918, 0.0015604496002197266, 0.0017679333686828613, 0.001975417137145996, 0.002182900905609131, 0.0023903846740722656, 0.0025978684425354004, 0.002805352210998535, 0.00301283597946167, 0.0032203197479248047, 0.0034278035163879395, 0.0036352872848510742, 0.003842771053314209, 0.004050254821777344, 0.0042577385902404785, 0.004465222358703613, 0.004672706127166748, 0.004880189895629883, 0.005087673664093018, 0.005295157432556152, 0.005502641201019287, 0.005710124969482422, 0.005917608737945557, 0.006125092506408691, 0.006332576274871826, 0.006540060043334961, 0.006747543811798096, 0.0069550275802612305, 0.007162511348724365, 0.0073699951171875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 36.0, 127.0, 273.0, 281.0, 179.0, 78.0, 28.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006201037322171032, -0.000606104324106127, -0.0005921049742028117, -0.0005781055660918355, -0.0005641062161885202, -0.000550106808077544, -0.0005361074581742287, -0.0005221080500632524, -0.0005081087001599371, -0.0004941092920489609, -0.0004801099421456456, -0.00046611056313849986, -0.0004521111841313541, -0.0004381117760203779, -0.00042411242611706257, -0.00041011301800608635, -0.00039611360989511013, -0.00038211423088796437, -0.0003681148518808186, -0.00035411547287367284, -0.0003401160938665271, -0.00032611668575555086, -0.00031211733585223556, -0.00029811792774125934, -0.00028411857783794403, -0.00027011919883079827, -0.0002561198198236525, -0.00024212044081650674, -0.00022812104725744575, -0.0002141216682503, -0.00020012228924315423, -0.00018612289568409324, -0.00017212351667694747, -0.0001581241376698017, -0.00014412475866265595, -0.0001301253796555102, -0.0001161259860964492, -0.00010212660708930343, -8.812722808215767e-05, -7.41278417990543e-05, -6.012846279190853e-05, -4.612908014678396e-05, -3.212969750165939e-05, -1.813031849451363e-05, -4.130935849389061e-06, 9.868446795735508e-06, 2.386782580288127e-05, 3.786721208598465e-05, 5.186659109313041e-05, 6.586597010027617e-05, 7.986535638337955e-05, 9.386473539052531e-05, 0.00010786412167362869, 0.00012186350068077445, 0.0001358628796879202, 0.00014986225869506598, 0.00016386163770221174, 0.0001778610167093575, 0.00019186039571650326, 0.00020585977472364902, 0.00021985916828271002, 0.00023385854728985578, 0.00024785794084891677, 0.00026185731985606253, 0.0002758566988632083]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 9.0, 17.0, 13.0, 14.0, 9.0, 17.0, 18.0, 23.0, 25.0, 20.0, 32.0, 19.0, 30.0, 41.0, 44.0, 37.0, 36.0, 50.0, 44.0, 33.0, 39.0, 35.0, 36.0, 43.0, 36.0, 29.0, 24.0, 29.0, 30.0, 22.0, 29.0, 18.0, 14.0, 16.0, 19.0, 15.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014156103134155273, -0.0001367218792438507, -0.00013188272714614868, -0.00012704357504844666, -0.00012220442295074463, -0.0001173652708530426, -0.00011252611875534058, -0.00010768696665763855, -0.00010284781455993652, -9.80086624622345e-05, -9.316951036453247e-05, -8.833035826683044e-05, -8.349120616912842e-05, -7.865205407142639e-05, -7.381290197372437e-05, -6.897374987602234e-05, -6.413459777832031e-05, -5.9295445680618286e-05, -5.445629358291626e-05, -4.9617141485214233e-05, -4.477798938751221e-05, -3.993883728981018e-05, -3.5099685192108154e-05, -3.0260533094406128e-05, -2.54213809967041e-05, -2.0582228899002075e-05, -1.574307680130005e-05, -1.0903924703598022e-05, -6.064772605895996e-06, -1.2256205081939697e-06, 3.6135315895080566e-06, 8.452683687210083e-06, 1.329183578491211e-05, 1.8130987882614136e-05, 2.2970139980316162e-05, 2.780929207801819e-05, 3.2648444175720215e-05, 3.748759627342224e-05, 4.232674837112427e-05, 4.7165900468826294e-05, 5.200505256652832e-05, 5.684420466423035e-05, 6.168335676193237e-05, 6.65225088596344e-05, 7.136166095733643e-05, 7.620081305503845e-05, 8.103996515274048e-05, 8.58791172504425e-05, 9.071826934814453e-05, 9.555742144584656e-05, 0.00010039657354354858, 0.00010523572564125061, 0.00011007487773895264, 0.00011491402983665466, 0.00011975318193435669, 0.00012459233403205872, 0.00012943148612976074, 0.00013427063822746277, 0.0001391097903251648, 0.00014394894242286682, 0.00014878809452056885, 0.00015362724661827087, 0.0001584663987159729, 0.00016330555081367493, 0.00016814470291137695]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 12.0, 7.0, 11.0, 9.0, 13.0, 15.0, 19.0, 20.0, 25.0, 23.0, 32.0, 28.0, 24.0, 39.0, 39.0, 36.0, 32.0, 48.0, 40.0, 30.0, 45.0, 38.0, 29.0, 33.0, 30.0, 35.0, 26.0, 31.0, 32.0, 35.0, 24.0, 23.0, 14.0, 14.0, 11.0, 14.0, 5.0, 9.0, 8.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-3.298828125, -3.205657958984375, -3.11248779296875, -3.019317626953125, -2.9261474609375, -2.832977294921875, -2.73980712890625, -2.646636962890625, -2.553466796875, -2.460296630859375, -2.36712646484375, -2.273956298828125, -2.1807861328125, -2.087615966796875, -1.99444580078125, -1.901275634765625, -1.80810546875, -1.714935302734375, -1.62176513671875, -1.528594970703125, -1.4354248046875, -1.342254638671875, -1.24908447265625, -1.155914306640625, -1.062744140625, -0.969573974609375, -0.87640380859375, -0.783233642578125, -0.6900634765625, -0.596893310546875, -0.50372314453125, -0.410552978515625, -0.3173828125, -0.224212646484375, -0.13104248046875, -0.037872314453125, 0.0552978515625, 0.148468017578125, 0.24163818359375, 0.334808349609375, 0.427978515625, 0.521148681640625, 0.61431884765625, 0.707489013671875, 0.8006591796875, 0.893829345703125, 0.98699951171875, 1.080169677734375, 1.17333984375, 1.266510009765625, 1.35968017578125, 1.452850341796875, 1.5460205078125, 1.639190673828125, 1.73236083984375, 1.825531005859375, 1.918701171875, 2.011871337890625, 2.10504150390625, 2.198211669921875, 2.2913818359375, 2.384552001953125, 2.47772216796875, 2.570892333984375, 2.6640625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 7.0, 20.0, 14.0, 24.0, 29.0, 30.0, 39.0, 58.0, 80.0, 112.0, 142.0, 273.0, 495.0, 1010.0, 2377.0, 5800.0, 14689.0, 36508.0, 86675.0, 198967.0, 367400.0, 191269.0, 83299.0, 34925.0, 14155.0, 5571.0, 2280.0, 972.0, 476.0, 231.0, 168.0, 92.0, 72.0, 57.0, 57.0, 28.0, 30.0, 26.0, 21.0, 14.0, 15.0, 7.0, 10.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0], "bins": [-3.607421875, -3.5057373046875, -3.404052734375, -3.3023681640625, -3.20068359375, -3.0989990234375, -2.997314453125, -2.8956298828125, -2.7939453125, -2.6922607421875, -2.590576171875, -2.4888916015625, -2.38720703125, -2.2855224609375, -2.183837890625, -2.0821533203125, -1.98046875, -1.8787841796875, -1.777099609375, -1.6754150390625, -1.57373046875, -1.4720458984375, -1.370361328125, -1.2686767578125, -1.1669921875, -1.0653076171875, -0.963623046875, -0.8619384765625, -0.76025390625, -0.6585693359375, -0.556884765625, -0.4552001953125, -0.353515625, -0.2518310546875, -0.150146484375, -0.0484619140625, 0.05322265625, 0.1549072265625, 0.256591796875, 0.3582763671875, 0.4599609375, 0.5616455078125, 0.663330078125, 0.7650146484375, 0.86669921875, 0.9683837890625, 1.070068359375, 1.1717529296875, 1.2734375, 1.3751220703125, 1.476806640625, 1.5784912109375, 1.68017578125, 1.7818603515625, 1.883544921875, 1.9852294921875, 2.0869140625, 2.1885986328125, 2.290283203125, 2.3919677734375, 2.49365234375, 2.5953369140625, 2.697021484375, 2.7987060546875, 2.900390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 8.0, 6.0, 16.0, 10.0, 14.0, 16.0, 22.0, 31.0, 19.0, 28.0, 40.0, 28.0, 35.0, 43.0, 59.0, 73.0, 148.0, 351.0, 1455.0, 164.0, 83.0, 47.0, 36.0, 34.0, 38.0, 29.0, 30.0, 19.0, 30.0, 23.0, 22.0, 17.0, 10.0, 12.0, 11.0, 6.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7275390625, -9.392578125, -9.0576171875, -8.72265625, -8.3876953125, -8.052734375, -7.7177734375, -7.3828125, -7.0478515625, -6.712890625, -6.3779296875, -6.04296875, -5.7080078125, -5.373046875, -5.0380859375, -4.703125, -4.3681640625, -4.033203125, -3.6982421875, -3.36328125, -3.0283203125, -2.693359375, -2.3583984375, -2.0234375, -1.6884765625, -1.353515625, -1.0185546875, -0.68359375, -0.3486328125, -0.013671875, 0.3212890625, 0.65625, 0.9912109375, 1.326171875, 1.6611328125, 1.99609375, 2.3310546875, 2.666015625, 3.0009765625, 3.3359375, 3.6708984375, 4.005859375, 4.3408203125, 4.67578125, 5.0107421875, 5.345703125, 5.6806640625, 6.015625, 6.3505859375, 6.685546875, 7.0205078125, 7.35546875, 7.6904296875, 8.025390625, 8.3603515625, 8.6953125, 9.0302734375, 9.365234375, 9.7001953125, 10.03515625, 10.3701171875, 10.705078125, 11.0400390625, 11.375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 7.0, 6.0, 11.0, 11.0, 19.0, 13.0, 17.0, 27.0, 32.0, 54.0, 80.0, 116.0, 180.0, 280.0, 611.0, 1715.0, 528739.0, 2609977.0, 2233.0, 634.0, 319.0, 162.0, 116.0, 79.0, 60.0, 48.0, 32.0, 19.0, 22.0, 12.0, 15.0, 9.0, 8.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.1875, -39.8173828125, -38.447265625, -37.0771484375, -35.70703125, -34.3369140625, -32.966796875, -31.5966796875, -30.2265625, -28.8564453125, -27.486328125, -26.1162109375, -24.74609375, -23.3759765625, -22.005859375, -20.6357421875, -19.265625, -17.8955078125, -16.525390625, -15.1552734375, -13.78515625, -12.4150390625, -11.044921875, -9.6748046875, -8.3046875, -6.9345703125, -5.564453125, -4.1943359375, -2.82421875, -1.4541015625, -0.083984375, 1.2861328125, 2.65625, 4.0263671875, 5.396484375, 6.7666015625, 8.13671875, 9.5068359375, 10.876953125, 12.2470703125, 13.6171875, 14.9873046875, 16.357421875, 17.7275390625, 19.09765625, 20.4677734375, 21.837890625, 23.2080078125, 24.578125, 25.9482421875, 27.318359375, 28.6884765625, 30.05859375, 31.4287109375, 32.798828125, 34.1689453125, 35.5390625, 36.9091796875, 38.279296875, 39.6494140625, 41.01953125, 42.3896484375, 43.759765625, 45.1298828125, 46.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 27.0, 153.0, 347.0, 315.0, 141.0, 22.0, 2.0, 2.0, 0.0, 1.0], "bins": [-69.21880340576172, -68.00346374511719, -66.78813171386719, -65.57279205322266, -64.35745239257812, -63.14211654663086, -61.926780700683594, -60.71144104003906, -59.4961051940918, -58.28076934814453, -57.0654296875, -55.850093841552734, -54.63475799560547, -53.41941833496094, -52.20408248901367, -50.988746643066406, -49.773406982421875, -48.55807113647461, -47.34273147583008, -46.12739562988281, -44.91205596923828, -43.696720123291016, -42.48138427734375, -41.26604461669922, -40.05070877075195, -38.83537292480469, -37.620033264160156, -36.40469741821289, -35.189361572265625, -33.974021911621094, -32.75868606567383, -31.54334831237793, -30.32801055908203, -29.112672805786133, -27.897335052490234, -26.68199920654297, -25.46666145324707, -24.251323699951172, -23.035987854003906, -21.820650100708008, -20.60531234741211, -19.38997459411621, -18.174636840820312, -16.959300994873047, -15.743963241577148, -14.52862548828125, -13.313288688659668, -12.097951889038086, -10.882614135742188, -9.667276382446289, -8.451939582824707, -7.236602306365967, -6.021265029907227, -4.805927753448486, -3.590590476989746, -2.375253677368164, -1.1599159240722656, 0.05542135238647461, 1.2707586288452148, 2.486095905303955, 3.7014331817626953, 4.9167704582214355, 6.132107734680176, 7.347444534301758, 8.562782287597656]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 17.0, 23.0, 19.0, 25.0, 19.0, 31.0, 24.0, 35.0, 29.0, 37.0, 26.0, 40.0, 41.0, 38.0, 44.0, 35.0, 40.0, 41.0, 25.0, 33.0, 34.0, 31.0, 20.0, 32.0, 20.0, 27.0, 26.0, 21.0, 16.0, 15.0, 21.0, 6.0, 12.0, 7.0, 7.0, 6.0, 9.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.22670555114746, -20.48387336730957, -19.741043090820312, -18.998210906982422, -18.25537872314453, -17.512548446655273, -16.769716262817383, -16.026885986328125, -15.284053802490234, -14.54122257232666, -13.798391342163086, -13.055559158325195, -12.312727928161621, -11.569896697998047, -10.827064514160156, -10.084233283996582, -9.341402053833008, -8.598570823669434, -7.855739116668701, -7.112907409667969, -6.3700761795043945, -5.62724494934082, -4.884413242340088, -4.1415815353393555, -3.3987503051757812, -2.655918836593628, -1.9130873680114746, -1.1702558994293213, -0.42742443084716797, 0.31540703773498535, 1.0582385063171387, 1.801070213317871, 2.543903350830078, 3.2867348194122314, 4.029566287994385, 4.772397994995117, 5.515229225158691, 6.258060455322266, 7.000892162322998, 7.7437238693237305, 8.486555099487305, 9.229386329650879, 9.972217559814453, 10.715049743652344, 11.457880973815918, 12.200712203979492, 12.943544387817383, 13.686375617980957, 14.429206848144531, 15.172038078308105, 15.91486930847168, 16.65770149230957, 17.400531768798828, 18.14336395263672, 18.88619613647461, 19.6290283203125, 20.371858596801758, 21.11469078063965, 21.857521057128906, 22.600353240966797, 23.343185424804688, 24.086015701293945, 24.828847885131836, 25.571678161621094, 26.314510345458984]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 3.0, 8.0, 8.0, 13.0, 12.0, 11.0, 15.0, 24.0, 16.0, 28.0, 22.0, 24.0, 26.0, 31.0, 31.0, 31.0, 25.0, 40.0, 55.0, 43.0, 41.0, 31.0, 30.0, 35.0, 33.0, 37.0, 23.0, 30.0, 28.0, 26.0, 31.0, 23.0, 22.0, 19.0, 20.0, 21.0, 15.0, 19.0, 9.0, 5.0, 9.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.47265625, -3.370147705078125, -3.26763916015625, -3.165130615234375, -3.0626220703125, -2.960113525390625, -2.85760498046875, -2.755096435546875, -2.652587890625, -2.550079345703125, -2.44757080078125, -2.345062255859375, -2.2425537109375, -2.140045166015625, -2.03753662109375, -1.935028076171875, -1.83251953125, -1.730010986328125, -1.62750244140625, -1.524993896484375, -1.4224853515625, -1.319976806640625, -1.21746826171875, -1.114959716796875, -1.012451171875, -0.909942626953125, -0.80743408203125, -0.704925537109375, -0.6024169921875, -0.499908447265625, -0.39739990234375, -0.294891357421875, -0.1923828125, -0.089874267578125, 0.01263427734375, 0.115142822265625, 0.2176513671875, 0.320159912109375, 0.42266845703125, 0.525177001953125, 0.627685546875, 0.730194091796875, 0.83270263671875, 0.935211181640625, 1.0377197265625, 1.140228271484375, 1.24273681640625, 1.345245361328125, 1.44775390625, 1.550262451171875, 1.65277099609375, 1.755279541015625, 1.8577880859375, 1.960296630859375, 2.06280517578125, 2.165313720703125, 2.267822265625, 2.370330810546875, 2.47283935546875, 2.575347900390625, 2.6778564453125, 2.780364990234375, 2.88287353515625, 2.985382080078125, 3.087890625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 4.0, 8.0, 10.0, 18.0, 23.0, 19.0, 27.0, 26.0, 36.0, 45.0, 55.0, 54.0, 93.0, 103.0, 139.0, 204.0, 432.0, 1782.0, 32566.0, 1352374.0, 2666509.0, 133785.0, 4243.0, 699.0, 246.0, 134.0, 122.0, 99.0, 75.0, 56.0, 46.0, 45.0, 31.0, 29.0, 24.0, 26.0, 18.0, 17.0, 7.0, 10.0, 10.0, 0.0, 4.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0], "bins": [-11.296875, -10.96630859375, -10.6357421875, -10.30517578125, -9.974609375, -9.64404296875, -9.3134765625, -8.98291015625, -8.65234375, -8.32177734375, -7.9912109375, -7.66064453125, -7.330078125, -6.99951171875, -6.6689453125, -6.33837890625, -6.0078125, -5.67724609375, -5.3466796875, -5.01611328125, -4.685546875, -4.35498046875, -4.0244140625, -3.69384765625, -3.36328125, -3.03271484375, -2.7021484375, -2.37158203125, -2.041015625, -1.71044921875, -1.3798828125, -1.04931640625, -0.71875, -0.38818359375, -0.0576171875, 0.27294921875, 0.603515625, 0.93408203125, 1.2646484375, 1.59521484375, 1.92578125, 2.25634765625, 2.5869140625, 2.91748046875, 3.248046875, 3.57861328125, 3.9091796875, 4.23974609375, 4.5703125, 4.90087890625, 5.2314453125, 5.56201171875, 5.892578125, 6.22314453125, 6.5537109375, 6.88427734375, 7.21484375, 7.54541015625, 7.8759765625, 8.20654296875, 8.537109375, 8.86767578125, 9.1982421875, 9.52880859375, 9.859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 10.0, 13.0, 10.0, 14.0, 17.0, 22.0, 28.0, 28.0, 48.0, 72.0, 78.0, 122.0, 137.0, 198.0, 286.0, 381.0, 447.0, 459.0, 419.0, 341.0, 240.0, 185.0, 140.0, 97.0, 62.0, 53.0, 46.0, 27.0, 21.0, 20.0, 13.0, 12.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.5909423828125, -6.392822265625, -6.1947021484375, -5.99658203125, -5.7984619140625, -5.600341796875, -5.4022216796875, -5.2041015625, -5.0059814453125, -4.807861328125, -4.6097412109375, -4.41162109375, -4.2135009765625, -4.015380859375, -3.8172607421875, -3.619140625, -3.4210205078125, -3.222900390625, -3.0247802734375, -2.82666015625, -2.6285400390625, -2.430419921875, -2.2322998046875, -2.0341796875, -1.8360595703125, -1.637939453125, -1.4398193359375, -1.24169921875, -1.0435791015625, -0.845458984375, -0.6473388671875, -0.44921875, -0.2510986328125, -0.052978515625, 0.1451416015625, 0.34326171875, 0.5413818359375, 0.739501953125, 0.9376220703125, 1.1357421875, 1.3338623046875, 1.531982421875, 1.7301025390625, 1.92822265625, 2.1263427734375, 2.324462890625, 2.5225830078125, 2.720703125, 2.9188232421875, 3.116943359375, 3.3150634765625, 3.51318359375, 3.7113037109375, 3.909423828125, 4.1075439453125, 4.3056640625, 4.5037841796875, 4.701904296875, 4.9000244140625, 5.09814453125, 5.2962646484375, 5.494384765625, 5.6925048828125, 5.890625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 4.0, 8.0, 15.0, 15.0, 18.0, 28.0, 37.0, 40.0, 71.0, 87.0, 124.0, 191.0, 277.0, 402.0, 667.0, 13883.0, 4068152.0, 107829.0, 956.0, 406.0, 279.0, 209.0, 144.0, 116.0, 81.0, 54.0, 42.0, 31.0, 25.0, 16.0, 18.0, 10.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.875, -28.8671875, -27.859375, -26.8515625, -25.84375, -24.8359375, -23.828125, -22.8203125, -21.8125, -20.8046875, -19.796875, -18.7890625, -17.78125, -16.7734375, -15.765625, -14.7578125, -13.75, -12.7421875, -11.734375, -10.7265625, -9.71875, -8.7109375, -7.703125, -6.6953125, -5.6875, -4.6796875, -3.671875, -2.6640625, -1.65625, -0.6484375, 0.359375, 1.3671875, 2.375, 3.3828125, 4.390625, 5.3984375, 6.40625, 7.4140625, 8.421875, 9.4296875, 10.4375, 11.4453125, 12.453125, 13.4609375, 14.46875, 15.4765625, 16.484375, 17.4921875, 18.5, 19.5078125, 20.515625, 21.5234375, 22.53125, 23.5390625, 24.546875, 25.5546875, 26.5625, 27.5703125, 28.578125, 29.5859375, 30.59375, 31.6015625, 32.609375, 33.6171875, 34.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 48.0, 152.0, 313.0, 313.0, 143.0, 34.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.572322845458984, -29.463878631591797, -27.355432510375977, -25.246986389160156, -23.13854217529297, -21.03009796142578, -18.92165184020996, -16.81320571899414, -14.704761505126953, -12.59631633758545, -10.487871170043945, -8.379426002502441, -6.2709808349609375, -4.162535667419434, -2.0540904998779297, 0.05435466766357422, 2.162799835205078, 4.271245002746582, 6.379690170288086, 8.48813533782959, 10.596580505371094, 12.705025672912598, 14.813470840454102, 16.921916961669922, 19.03036117553711, 21.138805389404297, 23.247251510620117, 25.355697631835938, 27.464141845703125, 29.572586059570312, 31.681032180786133, 33.78947830200195, 35.897926330566406, 38.006370544433594, 40.11481475830078, 42.223262786865234, 44.33170700073242, 46.44015121459961, 48.54859924316406, 50.65704345703125, 52.76548767089844, 54.873931884765625, 56.98237609863281, 59.090824127197266, 61.19926834106445, 63.30771255493164, 65.4161605834961, 67.52460479736328, 69.63304901123047, 71.74149322509766, 73.84993743896484, 75.95838165283203, 78.06683349609375, 80.17527770996094, 82.28372192382812, 84.39216613769531, 86.5006103515625, 88.60905456542969, 90.71749877929688, 92.82594299316406, 94.93438720703125, 97.04283905029297, 99.15128326416016, 101.25972747802734, 103.36817169189453]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 10.0, 4.0, 5.0, 8.0, 7.0, 11.0, 12.0, 15.0, 16.0, 25.0, 18.0, 24.0, 32.0, 28.0, 30.0, 31.0, 47.0, 39.0, 36.0, 49.0, 36.0, 40.0, 36.0, 33.0, 46.0, 40.0, 52.0, 39.0, 32.0, 28.0, 30.0, 18.0, 20.0, 19.0, 12.0, 16.0, 18.0, 9.0, 9.0, 6.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.979713439941406, -22.316659927368164, -21.653608322143555, -20.990554809570312, -20.327503204345703, -19.66444969177246, -19.00139808654785, -18.33834457397461, -17.67529296875, -17.012239456176758, -16.34918785095215, -15.686135292053223, -15.023082733154297, -14.360029220581055, -13.696976661682129, -13.033924102783203, -12.370870590209961, -11.707818031311035, -11.04476547241211, -10.381712913513184, -9.718660354614258, -9.055606842041016, -8.39255428314209, -7.729501724243164, -7.066449165344238, -6.4033966064453125, -5.740344047546387, -5.077291011810303, -4.414238452911377, -3.751185894012451, -3.0881330966949463, -2.4250802993774414, -1.7620258331298828, -1.0989731550216675, -0.43592047691345215, 0.22713220119476318, 0.8901848793029785, 1.5532374382019043, 2.216290235519409, 2.879343032836914, 3.54239559173584, 4.205448150634766, 4.868500709533691, 5.531553745269775, 6.194606304168701, 6.857658863067627, 7.520711898803711, 8.183764457702637, 8.846817016601562, 9.509869575500488, 10.172922134399414, 10.83597469329834, 11.499027252197266, 12.162080764770508, 12.825133323669434, 13.48818588256836, 14.151238441467285, 14.814291000366211, 15.477343559265137, 16.140396118164062, 16.803449630737305, 17.466501235961914, 18.129554748535156, 18.792606353759766, 19.455659866333008]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 20.0, 19.0, 20.0, 24.0, 14.0, 34.0, 24.0, 33.0, 26.0, 28.0, 32.0, 32.0, 29.0, 45.0, 54.0, 31.0, 44.0, 39.0, 37.0, 38.0, 39.0, 44.0, 42.0, 33.0, 21.0, 30.0, 24.0, 19.0, 21.0, 15.0, 9.0, 7.0, 11.0, 9.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.472930908203125, -3.36578369140625, -3.258636474609375, -3.1514892578125, -3.044342041015625, -2.93719482421875, -2.830047607421875, -2.722900390625, -2.615753173828125, -2.50860595703125, -2.401458740234375, -2.2943115234375, -2.187164306640625, -2.08001708984375, -1.972869873046875, -1.86572265625, -1.758575439453125, -1.65142822265625, -1.544281005859375, -1.4371337890625, -1.329986572265625, -1.22283935546875, -1.115692138671875, -1.008544921875, -0.901397705078125, -0.79425048828125, -0.687103271484375, -0.5799560546875, -0.472808837890625, -0.36566162109375, -0.258514404296875, -0.1513671875, -0.044219970703125, 0.06292724609375, 0.170074462890625, 0.2772216796875, 0.384368896484375, 0.49151611328125, 0.598663330078125, 0.705810546875, 0.812957763671875, 0.92010498046875, 1.027252197265625, 1.1343994140625, 1.241546630859375, 1.34869384765625, 1.455841064453125, 1.56298828125, 1.670135498046875, 1.77728271484375, 1.884429931640625, 1.9915771484375, 2.098724365234375, 2.20587158203125, 2.313018798828125, 2.420166015625, 2.527313232421875, 2.63446044921875, 2.741607666015625, 2.8487548828125, 2.955902099609375, 3.06304931640625, 3.170196533203125, 3.27734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 28.0, 25.0, 24.0, 38.0, 75.0, 111.0, 153.0, 232.0, 304.0, 465.0, 708.0, 994.0, 1375.0, 2013.0, 2846.0, 4301.0, 6010.0, 8886.0, 12490.0, 18304.0, 26968.0, 40852.0, 64013.0, 107949.0, 212449.0, 224806.0, 113778.0, 66679.0, 42513.0, 27692.0, 18796.0, 13148.0, 8884.0, 6214.0, 4451.0, 3141.0, 2034.0, 1442.0, 1045.0, 746.0, 438.0, 347.0, 257.0, 161.0, 121.0, 69.0, 57.0, 38.0, 26.0, 25.0, 6.0, 11.0, 3.0, 6.0, 2.0, 0.0, 3.0], "bins": [-0.52685546875, -0.5104141235351562, -0.4939727783203125, -0.47753143310546875, -0.461090087890625, -0.44464874267578125, -0.4282073974609375, -0.41176605224609375, -0.39532470703125, -0.37888336181640625, -0.3624420166015625, -0.34600067138671875, -0.329559326171875, -0.31311798095703125, -0.2966766357421875, -0.28023529052734375, -0.2637939453125, -0.24735260009765625, -0.2309112548828125, -0.21446990966796875, -0.198028564453125, -0.18158721923828125, -0.1651458740234375, -0.14870452880859375, -0.13226318359375, -0.11582183837890625, -0.0993804931640625, -0.08293914794921875, -0.066497802734375, -0.05005645751953125, -0.0336151123046875, -0.01717376708984375, -0.000732421875, 0.01570892333984375, 0.0321502685546875, 0.04859161376953125, 0.065032958984375, 0.08147430419921875, 0.0979156494140625, 0.11435699462890625, 0.13079833984375, 0.14723968505859375, 0.1636810302734375, 0.18012237548828125, 0.196563720703125, 0.21300506591796875, 0.2294464111328125, 0.24588775634765625, 0.2623291015625, 0.27877044677734375, 0.2952117919921875, 0.31165313720703125, 0.328094482421875, 0.34453582763671875, 0.3609771728515625, 0.37741851806640625, 0.39385986328125, 0.41030120849609375, 0.4267425537109375, 0.44318389892578125, 0.459625244140625, 0.47606658935546875, 0.4925079345703125, 0.5089492797851562, 0.525390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 8.0, 9.0, 9.0, 20.0, 14.0, 17.0, 21.0, 23.0, 27.0, 27.0, 21.0, 36.0, 30.0, 23.0, 38.0, 32.0, 41.0, 39.0, 42.0, 1057.0, 42.0, 51.0, 34.0, 35.0, 25.0, 35.0, 32.0, 24.0, 26.0, 28.0, 26.0, 15.0, 11.0, 15.0, 16.0, 7.0, 9.0, 9.0, 9.0, 2.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9033203125, -1.842681884765625, -1.78204345703125, -1.721405029296875, -1.6607666015625, -1.600128173828125, -1.53948974609375, -1.478851318359375, -1.418212890625, -1.357574462890625, -1.29693603515625, -1.236297607421875, -1.1756591796875, -1.115020751953125, -1.05438232421875, -0.993743896484375, -0.93310546875, -0.872467041015625, -0.81182861328125, -0.751190185546875, -0.6905517578125, -0.629913330078125, -0.56927490234375, -0.508636474609375, -0.447998046875, -0.387359619140625, -0.32672119140625, -0.266082763671875, -0.2054443359375, -0.144805908203125, -0.08416748046875, -0.023529052734375, 0.037109375, 0.097747802734375, 0.15838623046875, 0.219024658203125, 0.2796630859375, 0.340301513671875, 0.40093994140625, 0.461578369140625, 0.522216796875, 0.582855224609375, 0.64349365234375, 0.704132080078125, 0.7647705078125, 0.825408935546875, 0.88604736328125, 0.946685791015625, 1.00732421875, 1.067962646484375, 1.12860107421875, 1.189239501953125, 1.2498779296875, 1.310516357421875, 1.37115478515625, 1.431793212890625, 1.492431640625, 1.553070068359375, 1.61370849609375, 1.674346923828125, 1.7349853515625, 1.795623779296875, 1.85626220703125, 1.916900634765625, 1.9775390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 5.0, 10.0, 7.0, 18.0, 41.0, 48.0, 64.0, 89.0, 141.0, 190.0, 289.0, 392.0, 534.0, 825.0, 1153.0, 1567.0, 2190.0, 3289.0, 4575.0, 6722.0, 9891.0, 14788.0, 22682.0, 35484.0, 57403.0, 98210.0, 197229.0, 1315729.0, 125963.0, 70962.0, 43171.0, 27499.0, 17915.0, 11998.0, 8029.0, 5571.0, 3780.0, 2637.0, 1781.0, 1302.0, 888.0, 619.0, 456.0, 340.0, 204.0, 141.0, 96.0, 65.0, 59.0, 35.0, 21.0, 15.0, 10.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.50830078125, -0.49201202392578125, -0.4757232666015625, -0.45943450927734375, -0.443145751953125, -0.42685699462890625, -0.4105682373046875, -0.39427947998046875, -0.37799072265625, -0.36170196533203125, -0.3454132080078125, -0.32912445068359375, -0.312835693359375, -0.29654693603515625, -0.2802581787109375, -0.26396942138671875, -0.2476806640625, -0.23139190673828125, -0.2151031494140625, -0.19881439208984375, -0.182525634765625, -0.16623687744140625, -0.1499481201171875, -0.13365936279296875, -0.11737060546875, -0.10108184814453125, -0.0847930908203125, -0.06850433349609375, -0.052215576171875, -0.03592681884765625, -0.0196380615234375, -0.00334930419921875, 0.012939453125, 0.02922821044921875, 0.0455169677734375, 0.06180572509765625, 0.078094482421875, 0.09438323974609375, 0.1106719970703125, 0.12696075439453125, 0.14324951171875, 0.15953826904296875, 0.1758270263671875, 0.19211578369140625, 0.208404541015625, 0.22469329833984375, 0.2409820556640625, 0.25727081298828125, 0.2735595703125, 0.28984832763671875, 0.3061370849609375, 0.32242584228515625, 0.338714599609375, 0.35500335693359375, 0.3712921142578125, 0.38758087158203125, 0.40386962890625, 0.42015838623046875, 0.4364471435546875, 0.45273590087890625, 0.469024658203125, 0.48531341552734375, 0.5016021728515625, 0.5178909301757812, 0.5341796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 9.0, 13.0, 11.0, 18.0, 31.0, 34.0, 56.0, 64.0, 93.0, 73.0, 76.0, 99.0, 81.0, 70.0, 87.0, 43.0, 40.0, 26.0, 17.0, 17.0, 16.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000591278076171875, -0.0005702376365661621, -0.0005491971969604492, -0.0005281567573547363, -0.0005071163177490234, -0.00048607587814331055, -0.00046503543853759766, -0.00044399499893188477, -0.0004229545593261719, -0.000401914119720459, -0.0003808736801147461, -0.0003598332405090332, -0.0003387928009033203, -0.0003177523612976074, -0.00029671192169189453, -0.00027567148208618164, -0.00025463104248046875, -0.00023359060287475586, -0.00021255016326904297, -0.00019150972366333008, -0.0001704692840576172, -0.0001494288444519043, -0.0001283884048461914, -0.00010734796524047852, -8.630752563476562e-05, -6.526708602905273e-05, -4.4226646423339844e-05, -2.3186206817626953e-05, -2.1457672119140625e-06, 1.8894672393798828e-05, 3.993511199951172e-05, 6.097555160522461e-05, 8.20159912109375e-05, 0.00010305643081665039, 0.00012409687042236328, 0.00014513731002807617, 0.00016617774963378906, 0.00018721818923950195, 0.00020825862884521484, 0.00022929906845092773, 0.0002503395080566406, 0.0002713799476623535, 0.0002924203872680664, 0.0003134608268737793, 0.0003345012664794922, 0.0003555417060852051, 0.00037658214569091797, 0.00039762258529663086, 0.00041866302490234375, 0.00043970346450805664, 0.00046074390411376953, 0.0004817843437194824, 0.0005028247833251953, 0.0005238652229309082, 0.0005449056625366211, 0.000565946102142334, 0.0005869865417480469, 0.0006080269813537598, 0.0006290674209594727, 0.0006501078605651855, 0.0006711483001708984, 0.0006921887397766113, 0.0007132291793823242, 0.0007342696189880371, 0.00075531005859375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 14.0, 29.0, 41.0, 47.0, 49.0, 114.0, 142.0, 291.0, 830.0, 38302.0, 1006473.0, 1250.0, 376.0, 194.0, 120.0, 87.0, 58.0, 27.0, 23.0, 19.0, 13.0, 7.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0155487060546875, -0.015118718147277832, -0.014688730239868164, -0.014258742332458496, -0.013828754425048828, -0.01339876651763916, -0.012968778610229492, -0.012538790702819824, -0.012108802795410156, -0.011678814888000488, -0.01124882698059082, -0.010818839073181152, -0.010388851165771484, -0.009958863258361816, -0.009528875350952148, -0.00909888744354248, -0.008668899536132812, -0.008238911628723145, -0.0078089237213134766, -0.007378935813903809, -0.006948947906494141, -0.006518959999084473, -0.006088972091674805, -0.005658984184265137, -0.005228996276855469, -0.004799008369445801, -0.004369020462036133, -0.003939032554626465, -0.003509044647216797, -0.003079056739807129, -0.002649068832397461, -0.002219080924987793, -0.001789093017578125, -0.001359105110168457, -0.0009291172027587891, -0.0004991292953491211, -6.914138793945312e-05, 0.00036084651947021484, 0.0007908344268798828, 0.0012208223342895508, 0.0016508102416992188, 0.0020807981491088867, 0.0025107860565185547, 0.0029407739639282227, 0.0033707618713378906, 0.0038007497787475586, 0.0042307376861572266, 0.0046607255935668945, 0.0050907135009765625, 0.0055207014083862305, 0.0059506893157958984, 0.006380677223205566, 0.006810665130615234, 0.007240653038024902, 0.00767064094543457, 0.008100628852844238, 0.008530616760253906, 0.008960604667663574, 0.009390592575073242, 0.00982058048248291, 0.010250568389892578, 0.010680556297302246, 0.011110544204711914, 0.011540532112121582, 0.01197052001953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 41.0, 352.0, 510.0, 101.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0020160379353910685, -0.001980794593691826, -0.001945551368407905, -0.0019103080267086625, -0.00187506468500942, -0.0018398214597254992, -0.0018045781180262566, -0.001769334776327014, -0.0017340915510430932, -0.0016988482093438506, -0.0016636049840599298, -0.0016283616423606873, -0.0015931183006614447, -0.001557875075377524, -0.0015226317336782813, -0.0014873885083943605, -0.001452145166695118, -0.0014169018249958754, -0.0013816585997119546, -0.001346415258012712, -0.0013111719163134694, -0.0012759286910295486, -0.001240685349330306, -0.0012054420076310635, -0.0011701986659318209, -0.0011349553242325783, -0.0010997120989486575, -0.001064468757249415, -0.0010292254155501723, -0.0009939821902662516, -0.000958738848567009, -0.0009234955650754273, -0.0008882522815838456, -0.0008530089980922639, -0.0008177656563930213, -0.0007825223729014397, -0.000747279089409858, -0.0007120358059182763, -0.0006767924642190337, -0.000641549180727452, -0.0006063058972358704, -0.0005710626137442887, -0.0005358192720450461, -0.0005005759885534644, -0.00046533270506188273, -0.0004300893924664706, -0.00039484607987105846, -0.0003596027963794768, -0.0003243594546802342, -0.00028911614208482206, -0.0002538728585932404, -0.00021862954599782825, -0.00018338624795433134, -0.00014814294991083443, -0.0001128996373154223, -7.765635382384062e-05, -4.241304122842848e-05, -7.169739546952769e-06, 2.8073562134522945e-05, 6.331686745397747e-05, 9.856016549747437e-05, 0.00013380346354097128, 0.00016904677613638341, 0.0002042900596279651, 0.00023953337222337723]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 12.0, 12.0, 11.0, 17.0, 17.0, 21.0, 25.0, 37.0, 22.0, 23.0, 35.0, 37.0, 29.0, 30.0, 50.0, 38.0, 44.0, 63.0, 40.0, 32.0, 42.0, 31.0, 39.0, 22.0, 37.0, 30.0, 22.0, 35.0, 18.0, 16.0, 17.0, 12.0, 14.0, 8.0, 9.0, 5.0, 5.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00023794174194335938, -0.00023050233721733093, -0.0002230629324913025, -0.00021562352776527405, -0.0002081841230392456, -0.00020074471831321716, -0.00019330531358718872, -0.00018586590886116028, -0.00017842650413513184, -0.0001709870994091034, -0.00016354769468307495, -0.0001561082899570465, -0.00014866888523101807, -0.00014122948050498962, -0.00013379007577896118, -0.00012635067105293274, -0.0001189112663269043, -0.00011147186160087585, -0.00010403245687484741, -9.659305214881897e-05, -8.915364742279053e-05, -8.171424269676208e-05, -7.427483797073364e-05, -6.68354332447052e-05, -5.939602851867676e-05, -5.1956623792648315e-05, -4.451721906661987e-05, -3.707781434059143e-05, -2.9638409614562988e-05, -2.2199004888534546e-05, -1.4759600162506104e-05, -7.320195436477661e-06, 1.1920928955078125e-07, 7.558614015579224e-06, 1.4998018741607666e-05, 2.243742346763611e-05, 2.987682819366455e-05, 3.731623291969299e-05, 4.4755637645721436e-05, 5.219504237174988e-05, 5.963444709777832e-05, 6.707385182380676e-05, 7.45132565498352e-05, 8.195266127586365e-05, 8.939206600189209e-05, 9.683147072792053e-05, 0.00010427087545394897, 0.00011171028017997742, 0.00011914968490600586, 0.0001265890896320343, 0.00013402849435806274, 0.0001414678990840912, 0.00014890730381011963, 0.00015634670853614807, 0.00016378611326217651, 0.00017122551798820496, 0.0001786649227142334, 0.00018610432744026184, 0.00019354373216629028, 0.00020098313689231873, 0.00020842254161834717, 0.0002158619463443756, 0.00022330135107040405, 0.0002307407557964325, 0.00023818016052246094]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 20.0, 19.0, 20.0, 24.0, 14.0, 34.0, 24.0, 33.0, 26.0, 28.0, 32.0, 32.0, 29.0, 45.0, 54.0, 31.0, 44.0, 39.0, 37.0, 38.0, 39.0, 44.0, 42.0, 33.0, 21.0, 30.0, 24.0, 19.0, 21.0, 15.0, 9.0, 7.0, 11.0, 9.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.472930908203125, -3.36578369140625, -3.258636474609375, -3.1514892578125, -3.044342041015625, -2.93719482421875, -2.830047607421875, -2.722900390625, -2.615753173828125, -2.50860595703125, -2.401458740234375, -2.2943115234375, -2.187164306640625, -2.08001708984375, -1.972869873046875, -1.86572265625, -1.758575439453125, -1.65142822265625, -1.544281005859375, -1.4371337890625, -1.329986572265625, -1.22283935546875, -1.115692138671875, -1.008544921875, -0.901397705078125, -0.79425048828125, -0.687103271484375, -0.5799560546875, -0.472808837890625, -0.36566162109375, -0.258514404296875, -0.1513671875, -0.044219970703125, 0.06292724609375, 0.170074462890625, 0.2772216796875, 0.384368896484375, 0.49151611328125, 0.598663330078125, 0.705810546875, 0.812957763671875, 0.92010498046875, 1.027252197265625, 1.1343994140625, 1.241546630859375, 1.34869384765625, 1.455841064453125, 1.56298828125, 1.670135498046875, 1.77728271484375, 1.884429931640625, 1.9915771484375, 2.098724365234375, 2.20587158203125, 2.313018798828125, 2.420166015625, 2.527313232421875, 2.63446044921875, 2.741607666015625, 2.8487548828125, 2.955902099609375, 3.06304931640625, 3.170196533203125, 3.27734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 10.0, 11.0, 16.0, 24.0, 24.0, 27.0, 37.0, 53.0, 62.0, 98.0, 126.0, 169.0, 264.0, 567.0, 1548.0, 7210.0, 46621.0, 328456.0, 572347.0, 75160.0, 11730.0, 2138.0, 719.0, 369.0, 203.0, 141.0, 108.0, 63.0, 62.0, 44.0, 31.0, 20.0, 19.0, 15.0, 10.0, 15.0, 6.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.50018310546875, -7.2738037109375, -7.04742431640625, -6.821044921875, -6.59466552734375, -6.3682861328125, -6.14190673828125, -5.91552734375, -5.68914794921875, -5.4627685546875, -5.23638916015625, -5.010009765625, -4.78363037109375, -4.5572509765625, -4.33087158203125, -4.1044921875, -3.87811279296875, -3.6517333984375, -3.42535400390625, -3.198974609375, -2.97259521484375, -2.7462158203125, -2.51983642578125, -2.29345703125, -2.06707763671875, -1.8406982421875, -1.61431884765625, -1.387939453125, -1.16156005859375, -0.9351806640625, -0.70880126953125, -0.482421875, -0.25604248046875, -0.0296630859375, 0.19671630859375, 0.423095703125, 0.64947509765625, 0.8758544921875, 1.10223388671875, 1.32861328125, 1.55499267578125, 1.7813720703125, 2.00775146484375, 2.234130859375, 2.46051025390625, 2.6868896484375, 2.91326904296875, 3.1396484375, 3.36602783203125, 3.5924072265625, 3.81878662109375, 4.045166015625, 4.27154541015625, 4.4979248046875, 4.72430419921875, 4.95068359375, 5.17706298828125, 5.4034423828125, 5.62982177734375, 5.856201171875, 6.08258056640625, 6.3089599609375, 6.53533935546875, 6.76171875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 5.0, 12.0, 9.0, 16.0, 10.0, 15.0, 23.0, 22.0, 34.0, 30.0, 27.0, 38.0, 40.0, 43.0, 59.0, 71.0, 129.0, 352.0, 1465.0, 147.0, 78.0, 56.0, 45.0, 27.0, 30.0, 28.0, 33.0, 20.0, 19.0, 17.0, 18.0, 11.0, 15.0, 14.0, 13.0, 9.0, 7.0, 9.0, 6.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.7890625, -10.452880859375, -10.11669921875, -9.780517578125, -9.4443359375, -9.108154296875, -8.77197265625, -8.435791015625, -8.099609375, -7.763427734375, -7.42724609375, -7.091064453125, -6.7548828125, -6.418701171875, -6.08251953125, -5.746337890625, -5.41015625, -5.073974609375, -4.73779296875, -4.401611328125, -4.0654296875, -3.729248046875, -3.39306640625, -3.056884765625, -2.720703125, -2.384521484375, -2.04833984375, -1.712158203125, -1.3759765625, -1.039794921875, -0.70361328125, -0.367431640625, -0.03125, 0.304931640625, 0.64111328125, 0.977294921875, 1.3134765625, 1.649658203125, 1.98583984375, 2.322021484375, 2.658203125, 2.994384765625, 3.33056640625, 3.666748046875, 4.0029296875, 4.339111328125, 4.67529296875, 5.011474609375, 5.34765625, 5.683837890625, 6.02001953125, 6.356201171875, 6.6923828125, 7.028564453125, 7.36474609375, 7.700927734375, 8.037109375, 8.373291015625, 8.70947265625, 9.045654296875, 9.3818359375, 9.718017578125, 10.05419921875, 10.390380859375, 10.7265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 2.0, 9.0, 8.0, 8.0, 11.0, 16.0, 16.0, 24.0, 15.0, 40.0, 30.0, 43.0, 45.0, 55.0, 67.0, 81.0, 124.0, 208.0, 463.0, 1203.0, 21611.0, 3108733.0, 10698.0, 973.0, 406.0, 215.0, 136.0, 112.0, 82.0, 53.0, 46.0, 28.0, 32.0, 24.0, 30.0, 10.0, 12.0, 8.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.61279296875, -33.4755859375, -32.33837890625, -31.201171875, -30.06396484375, -28.9267578125, -27.78955078125, -26.65234375, -25.51513671875, -24.3779296875, -23.24072265625, -22.103515625, -20.96630859375, -19.8291015625, -18.69189453125, -17.5546875, -16.41748046875, -15.2802734375, -14.14306640625, -13.005859375, -11.86865234375, -10.7314453125, -9.59423828125, -8.45703125, -7.31982421875, -6.1826171875, -5.04541015625, -3.908203125, -2.77099609375, -1.6337890625, -0.49658203125, 0.640625, 1.77783203125, 2.9150390625, 4.05224609375, 5.189453125, 6.32666015625, 7.4638671875, 8.60107421875, 9.73828125, 10.87548828125, 12.0126953125, 13.14990234375, 14.287109375, 15.42431640625, 16.5615234375, 17.69873046875, 18.8359375, 19.97314453125, 21.1103515625, 22.24755859375, 23.384765625, 24.52197265625, 25.6591796875, 26.79638671875, 27.93359375, 29.07080078125, 30.2080078125, 31.34521484375, 32.482421875, 33.61962890625, 34.7568359375, 35.89404296875, 37.03125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 22.0, 89.0, 284.0, 360.0, 210.0, 43.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.74382781982422, -51.605743408203125, -50.46765899658203, -49.32957077026367, -48.19148635864258, -47.053401947021484, -45.91531753540039, -44.77722930908203, -43.63914489746094, -42.501060485839844, -41.36297607421875, -40.22488784790039, -39.0868034362793, -37.9487190246582, -36.81063461303711, -35.67254638671875, -34.534461975097656, -33.39637756347656, -32.25829315185547, -31.120206832885742, -29.982120513916016, -28.844036102294922, -27.705951690673828, -26.5678653717041, -25.42978286743164, -24.291698455810547, -23.15361213684082, -22.015527725219727, -20.87744140625, -19.739356994628906, -18.601272583007812, -17.463186264038086, -16.32509994506836, -15.18701457977295, -14.048929214477539, -12.910844802856445, -11.772758483886719, -10.634674072265625, -9.496588706970215, -8.358503341674805, -7.2204179763793945, -6.082332611083984, -4.944247245788574, -3.8061623573303223, -2.668076992034912, -1.529991626739502, -0.39190673828125, 0.7461786270141602, 1.8842639923095703, 3.0223493576049805, 4.160434722900391, 5.298519611358643, 6.436604976654053, 7.574690341949463, 8.712775230407715, 9.850860595703125, 10.988945960998535, 12.127031326293945, 13.265116691589355, 14.403202056884766, 15.54128646850586, 16.679372787475586, 17.81745719909668, 18.955543518066406, 20.0936279296875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 12.0, 11.0, 16.0, 14.0, 13.0, 36.0, 23.0, 28.0, 37.0, 38.0, 46.0, 41.0, 47.0, 51.0, 50.0, 57.0, 57.0, 48.0, 61.0, 44.0, 42.0, 39.0, 26.0, 33.0, 22.0, 23.0, 13.0, 12.0, 18.0, 7.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.57958221435547, -50.222007751464844, -48.86442947387695, -47.50685501098633, -46.14927673339844, -44.79170227050781, -43.43412780761719, -42.0765495300293, -40.71897506713867, -39.36140060424805, -38.003822326660156, -36.64624786376953, -35.28866958618164, -33.931095123291016, -32.573516845703125, -31.2159423828125, -29.858366012573242, -28.500789642333984, -27.143213272094727, -25.78563690185547, -24.428062438964844, -23.070486068725586, -21.712909698486328, -20.355335235595703, -18.997756958007812, -17.640180587768555, -16.282604217529297, -14.925028800964355, -13.567453384399414, -12.209877014160156, -10.852300643920898, -9.494725227355957, -8.137149810791016, -6.779573917388916, -5.421998023986816, -4.064421653747559, -2.706845760345459, -1.3492698669433594, 0.008306503295898438, 1.3658819198608398, 2.7234582901000977, 4.081034183502197, 5.438610076904297, 6.796186447143555, 8.153762817382812, 9.511338233947754, 10.868914604187012, 12.226490020751953, 13.584066390991211, 14.941642761230469, 16.299219131469727, 17.656795501708984, 19.01436996459961, 20.371946334838867, 21.729522705078125, 23.08709716796875, 24.44467544555664, 25.8022518157959, 27.159828186035156, 28.51740264892578, 29.87497901916504, 31.232555389404297, 32.59013366699219, 33.94770812988281, 35.30528259277344]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 4.0, 9.0, 8.0, 14.0, 13.0, 25.0, 24.0, 27.0, 22.0, 27.0, 31.0, 30.0, 29.0, 35.0, 35.0, 41.0, 40.0, 39.0, 41.0, 54.0, 47.0, 23.0, 47.0, 44.0, 34.0, 43.0, 29.0, 28.0, 20.0, 31.0, 14.0, 22.0, 17.0, 1.0, 10.0, 4.0, 11.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.121795654296875, -3.99359130859375, -3.865386962890625, -3.7371826171875, -3.608978271484375, -3.48077392578125, -3.352569580078125, -3.224365234375, -3.096160888671875, -2.96795654296875, -2.839752197265625, -2.7115478515625, -2.583343505859375, -2.45513916015625, -2.326934814453125, -2.19873046875, -2.070526123046875, -1.94232177734375, -1.814117431640625, -1.6859130859375, -1.557708740234375, -1.42950439453125, -1.301300048828125, -1.173095703125, -1.044891357421875, -0.91668701171875, -0.788482666015625, -0.6602783203125, -0.532073974609375, -0.40386962890625, -0.275665283203125, -0.1474609375, -0.019256591796875, 0.10894775390625, 0.237152099609375, 0.3653564453125, 0.493560791015625, 0.62176513671875, 0.749969482421875, 0.878173828125, 1.006378173828125, 1.13458251953125, 1.262786865234375, 1.3909912109375, 1.519195556640625, 1.64739990234375, 1.775604248046875, 1.90380859375, 2.032012939453125, 2.16021728515625, 2.288421630859375, 2.4166259765625, 2.544830322265625, 2.67303466796875, 2.801239013671875, 2.929443359375, 3.057647705078125, 3.18585205078125, 3.314056396484375, 3.4422607421875, 3.570465087890625, 3.69866943359375, 3.826873779296875, 3.955078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 12.0, 6.0, 13.0, 17.0, 23.0, 20.0, 39.0, 32.0, 47.0, 65.0, 90.0, 152.0, 237.0, 397.0, 793.0, 2226.0, 10856.0, 79154.0, 524677.0, 1629817.0, 1448927.0, 421252.0, 63009.0, 8751.0, 1964.0, 712.0, 321.0, 213.0, 126.0, 70.0, 68.0, 41.0, 34.0, 24.0, 25.0, 20.0, 14.0, 7.0, 4.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.43524169921875, -5.2650146484375, -5.09478759765625, -4.924560546875, -4.75433349609375, -4.5841064453125, -4.41387939453125, -4.24365234375, -4.07342529296875, -3.9031982421875, -3.73297119140625, -3.562744140625, -3.39251708984375, -3.2222900390625, -3.05206298828125, -2.8818359375, -2.71160888671875, -2.5413818359375, -2.37115478515625, -2.200927734375, -2.03070068359375, -1.8604736328125, -1.69024658203125, -1.52001953125, -1.34979248046875, -1.1795654296875, -1.00933837890625, -0.839111328125, -0.66888427734375, -0.4986572265625, -0.32843017578125, -0.158203125, 0.01202392578125, 0.1822509765625, 0.35247802734375, 0.522705078125, 0.69293212890625, 0.8631591796875, 1.03338623046875, 1.20361328125, 1.37384033203125, 1.5440673828125, 1.71429443359375, 1.884521484375, 2.05474853515625, 2.2249755859375, 2.39520263671875, 2.5654296875, 2.73565673828125, 2.9058837890625, 3.07611083984375, 3.246337890625, 3.41656494140625, 3.5867919921875, 3.75701904296875, 3.92724609375, 4.09747314453125, 4.2677001953125, 4.43792724609375, 4.608154296875, 4.77838134765625, 4.9486083984375, 5.11883544921875, 5.2890625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 6.0, 11.0, 13.0, 17.0, 16.0, 31.0, 50.0, 48.0, 67.0, 97.0, 134.0, 169.0, 247.0, 305.0, 388.0, 456.0, 423.0, 395.0, 299.0, 235.0, 188.0, 132.0, 81.0, 70.0, 50.0, 33.0, 23.0, 19.0, 15.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.49609375, -7.2811279296875, -7.066162109375, -6.8511962890625, -6.63623046875, -6.4212646484375, -6.206298828125, -5.9913330078125, -5.7763671875, -5.5614013671875, -5.346435546875, -5.1314697265625, -4.91650390625, -4.7015380859375, -4.486572265625, -4.2716064453125, -4.056640625, -3.8416748046875, -3.626708984375, -3.4117431640625, -3.19677734375, -2.9818115234375, -2.766845703125, -2.5518798828125, -2.3369140625, -2.1219482421875, -1.906982421875, -1.6920166015625, -1.47705078125, -1.2620849609375, -1.047119140625, -0.8321533203125, -0.6171875, -0.4022216796875, -0.187255859375, 0.0277099609375, 0.24267578125, 0.4576416015625, 0.672607421875, 0.8875732421875, 1.1025390625, 1.3175048828125, 1.532470703125, 1.7474365234375, 1.96240234375, 2.1773681640625, 2.392333984375, 2.6072998046875, 2.822265625, 3.0372314453125, 3.252197265625, 3.4671630859375, 3.68212890625, 3.8970947265625, 4.112060546875, 4.3270263671875, 4.5419921875, 4.7569580078125, 4.971923828125, 5.1868896484375, 5.40185546875, 5.6168212890625, 5.831787109375, 6.0467529296875, 6.26171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 11.0, 19.0, 17.0, 26.0, 26.0, 52.0, 68.0, 118.0, 165.0, 261.0, 446.0, 747.0, 1618.0, 10611.0, 3220024.0, 952049.0, 5007.0, 1323.0, 589.0, 358.0, 238.0, 148.0, 107.0, 62.0, 52.0, 42.0, 23.0, 12.0, 9.0, 14.0, 6.0, 7.0, 3.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.715087890625, -19.91455078125, -19.114013671875, -18.3134765625, -17.512939453125, -16.71240234375, -15.911865234375, -15.111328125, -14.310791015625, -13.51025390625, -12.709716796875, -11.9091796875, -11.108642578125, -10.30810546875, -9.507568359375, -8.70703125, -7.906494140625, -7.10595703125, -6.305419921875, -5.5048828125, -4.704345703125, -3.90380859375, -3.103271484375, -2.302734375, -1.502197265625, -0.70166015625, 0.098876953125, 0.8994140625, 1.699951171875, 2.50048828125, 3.301025390625, 4.1015625, 4.902099609375, 5.70263671875, 6.503173828125, 7.3037109375, 8.104248046875, 8.90478515625, 9.705322265625, 10.505859375, 11.306396484375, 12.10693359375, 12.907470703125, 13.7080078125, 14.508544921875, 15.30908203125, 16.109619140625, 16.91015625, 17.710693359375, 18.51123046875, 19.311767578125, 20.1123046875, 20.912841796875, 21.71337890625, 22.513916015625, 23.314453125, 24.114990234375, 24.91552734375, 25.716064453125, 26.5166015625, 27.317138671875, 28.11767578125, 28.918212890625, 29.71875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 42.0, 386.0, 498.0, 86.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.50393676757812, -132.3837890625, -128.26364135742188, -124.14350891113281, -120.02336120605469, -115.90321350097656, -111.78307342529297, -107.66293334960938, -103.54278564453125, -99.42263793945312, -95.30249786376953, -91.18235778808594, -87.06221008300781, -82.94206237792969, -78.8219223022461, -74.7017822265625, -70.58163452148438, -66.46148681640625, -62.341346740722656, -58.2212028503418, -54.10105895996094, -49.98091506958008, -45.86077117919922, -41.74062728881836, -37.6204833984375, -33.50033950805664, -29.38019561767578, -25.260051727294922, -21.139907836914062, -17.019763946533203, -12.899620056152344, -8.779476165771484, -4.6593170166015625, -0.5391731262207031, 3.5809707641601562, 7.701114654541016, 11.821258544921875, 15.941402435302734, 20.061546325683594, 24.181690216064453, 28.301834106445312, 32.42197799682617, 36.54212188720703, 40.66226577758789, 44.78240966796875, 48.90255355834961, 53.02269744873047, 57.14284133911133, 61.26298522949219, 65.38313293457031, 69.5032730102539, 73.6234130859375, 77.74356079101562, 81.86370849609375, 85.98384857177734, 90.10398864746094, 94.22413635253906, 98.34428405761719, 102.46442413330078, 106.58456420898438, 110.7047119140625, 114.82485961914062, 118.94499969482422, 123.06513977050781, 127.18528747558594]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 3.0, 6.0, 10.0, 19.0, 14.0, 12.0, 19.0, 30.0, 33.0, 39.0, 36.0, 44.0, 32.0, 52.0, 48.0, 47.0, 43.0, 40.0, 48.0, 47.0, 39.0, 48.0, 39.0, 35.0, 28.0, 31.0, 30.0, 15.0, 16.0, 15.0, 15.0, 10.0, 3.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.92617416381836, -22.146080017089844, -21.365985870361328, -20.585891723632812, -19.805795669555664, -19.02570152282715, -18.245607376098633, -17.465513229370117, -16.68541717529297, -15.905323028564453, -15.125227928161621, -14.345133781433105, -13.565038681030273, -12.784944534301758, -12.004850387573242, -11.224756240844727, -10.444662094116211, -9.664567947387695, -8.884472846984863, -8.104378700256348, -7.324284076690674, -6.544189453125, -5.764095306396484, -4.9840006828308105, -4.203906059265137, -3.423811435699463, -2.643717050552368, -1.8636226654052734, -1.0835280418395996, -0.3034334182739258, 0.47666072845458984, 1.2567553520202637, 2.0368499755859375, 2.8169445991516113, 3.597038984298706, 4.377133369445801, 5.157227993011475, 5.937322616577148, 6.717416763305664, 7.497511386871338, 8.277606010437012, 9.057700157165527, 9.83779525756836, 10.617889404296875, 11.39798355102539, 12.178078651428223, 12.958172798156738, 13.73826789855957, 14.518362045288086, 15.298456192016602, 16.078550338745117, 16.858646392822266, 17.63874053955078, 18.418834686279297, 19.198928833007812, 19.979022979736328, 20.759117126464844, 21.53921127319336, 22.319305419921875, 23.09939956665039, 23.87949562072754, 24.659589767456055, 25.43968391418457, 26.219778060913086, 26.999874114990234]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 10.0, 5.0, 9.0, 7.0, 10.0, 3.0, 20.0, 14.0, 20.0, 20.0, 26.0, 29.0, 21.0, 24.0, 35.0, 35.0, 31.0, 43.0, 35.0, 38.0, 39.0, 36.0, 36.0, 49.0, 48.0, 37.0, 35.0, 30.0, 31.0, 26.0, 28.0, 22.0, 22.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.515625, -3.40960693359375, -3.3035888671875, -3.19757080078125, -3.091552734375, -2.98553466796875, -2.8795166015625, -2.77349853515625, -2.66748046875, -2.56146240234375, -2.4554443359375, -2.34942626953125, -2.243408203125, -2.13739013671875, -2.0313720703125, -1.92535400390625, -1.8193359375, -1.71331787109375, -1.6072998046875, -1.50128173828125, -1.395263671875, -1.28924560546875, -1.1832275390625, -1.07720947265625, -0.97119140625, -0.86517333984375, -0.7591552734375, -0.65313720703125, -0.547119140625, -0.44110107421875, -0.3350830078125, -0.22906494140625, -0.123046875, -0.01702880859375, 0.0889892578125, 0.19500732421875, 0.301025390625, 0.40704345703125, 0.5130615234375, 0.61907958984375, 0.72509765625, 0.83111572265625, 0.9371337890625, 1.04315185546875, 1.149169921875, 1.25518798828125, 1.3612060546875, 1.46722412109375, 1.5732421875, 1.67926025390625, 1.7852783203125, 1.89129638671875, 1.997314453125, 2.10333251953125, 2.2093505859375, 2.31536865234375, 2.42138671875, 2.52740478515625, 2.6334228515625, 2.73944091796875, 2.845458984375, 2.95147705078125, 3.0574951171875, 3.16351318359375, 3.26953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 3.0, 13.0, 28.0, 20.0, 42.0, 77.0, 123.0, 194.0, 270.0, 392.0, 628.0, 906.0, 1378.0, 2096.0, 3099.0, 5029.0, 8022.0, 12552.0, 20345.0, 33143.0, 57492.0, 106304.0, 230511.0, 275157.0, 125745.0, 66042.0, 37280.0, 22821.0, 14039.0, 8925.0, 5550.0, 3755.0, 2258.0, 1498.0, 928.0, 655.0, 430.0, 261.0, 201.0, 120.0, 85.0, 39.0, 32.0, 33.0, 16.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67041015625, -0.6495361328125, -0.628662109375, -0.6077880859375, -0.5869140625, -0.5660400390625, -0.545166015625, -0.5242919921875, -0.50341796875, -0.4825439453125, -0.461669921875, -0.4407958984375, -0.419921875, -0.3990478515625, -0.378173828125, -0.3572998046875, -0.33642578125, -0.3155517578125, -0.294677734375, -0.2738037109375, -0.2529296875, -0.2320556640625, -0.211181640625, -0.1903076171875, -0.16943359375, -0.1485595703125, -0.127685546875, -0.1068115234375, -0.0859375, -0.0650634765625, -0.044189453125, -0.0233154296875, -0.00244140625, 0.0184326171875, 0.039306640625, 0.0601806640625, 0.0810546875, 0.1019287109375, 0.122802734375, 0.1436767578125, 0.16455078125, 0.1854248046875, 0.206298828125, 0.2271728515625, 0.248046875, 0.2689208984375, 0.289794921875, 0.3106689453125, 0.33154296875, 0.3524169921875, 0.373291015625, 0.3941650390625, 0.4150390625, 0.4359130859375, 0.456787109375, 0.4776611328125, 0.49853515625, 0.5194091796875, 0.540283203125, 0.5611572265625, 0.58203125, 0.6029052734375, 0.623779296875, 0.6446533203125, 0.66552734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 12.0, 9.0, 12.0, 13.0, 11.0, 26.0, 25.0, 42.0, 29.0, 31.0, 44.0, 38.0, 32.0, 56.0, 57.0, 49.0, 1073.0, 58.0, 40.0, 39.0, 48.0, 31.0, 37.0, 31.0, 27.0, 28.0, 22.0, 18.0, 21.0, 10.0, 11.0, 10.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.72064208984375, -2.6365966796875, -2.55255126953125, -2.468505859375, -2.38446044921875, -2.3004150390625, -2.21636962890625, -2.13232421875, -2.04827880859375, -1.9642333984375, -1.88018798828125, -1.796142578125, -1.71209716796875, -1.6280517578125, -1.54400634765625, -1.4599609375, -1.37591552734375, -1.2918701171875, -1.20782470703125, -1.123779296875, -1.03973388671875, -0.9556884765625, -0.87164306640625, -0.78759765625, -0.70355224609375, -0.6195068359375, -0.53546142578125, -0.451416015625, -0.36737060546875, -0.2833251953125, -0.19927978515625, -0.115234375, -0.03118896484375, 0.0528564453125, 0.13690185546875, 0.220947265625, 0.30499267578125, 0.3890380859375, 0.47308349609375, 0.55712890625, 0.64117431640625, 0.7252197265625, 0.80926513671875, 0.893310546875, 0.97735595703125, 1.0614013671875, 1.14544677734375, 1.2294921875, 1.31353759765625, 1.3975830078125, 1.48162841796875, 1.565673828125, 1.64971923828125, 1.7337646484375, 1.81781005859375, 1.90185546875, 1.98590087890625, 2.0699462890625, 2.15399169921875, 2.238037109375, 2.32208251953125, 2.4061279296875, 2.49017333984375, 2.57421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 11.0, 18.0, 22.0, 21.0, 38.0, 55.0, 95.0, 121.0, 213.0, 304.0, 470.0, 703.0, 1067.0, 1617.0, 2584.0, 4043.0, 6446.0, 10297.0, 16710.0, 28174.0, 49398.0, 92615.0, 206317.0, 1373086.0, 137841.0, 68475.0, 38144.0, 22234.0, 13306.0, 8332.0, 5037.0, 3262.0, 2113.0, 1328.0, 939.0, 550.0, 375.0, 248.0, 180.0, 104.0, 87.0, 51.0, 41.0, 18.0, 12.0, 10.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74951171875, -0.7269821166992188, -0.7044525146484375, -0.6819229125976562, -0.659393310546875, -0.6368637084960938, -0.6143341064453125, -0.5918045043945312, -0.56927490234375, -0.5467453002929688, -0.5242156982421875, -0.5016860961914062, -0.479156494140625, -0.45662689208984375, -0.4340972900390625, -0.41156768798828125, -0.3890380859375, -0.36650848388671875, -0.3439788818359375, -0.32144927978515625, -0.298919677734375, -0.27639007568359375, -0.2538604736328125, -0.23133087158203125, -0.20880126953125, -0.18627166748046875, -0.1637420654296875, -0.14121246337890625, -0.118682861328125, -0.09615325927734375, -0.0736236572265625, -0.05109405517578125, -0.028564453125, -0.00603485107421875, 0.0164947509765625, 0.03902435302734375, 0.061553955078125, 0.08408355712890625, 0.1066131591796875, 0.12914276123046875, 0.15167236328125, 0.17420196533203125, 0.1967315673828125, 0.21926116943359375, 0.241790771484375, 0.26432037353515625, 0.2868499755859375, 0.30937957763671875, 0.3319091796875, 0.35443878173828125, 0.3769683837890625, 0.39949798583984375, 0.422027587890625, 0.44455718994140625, 0.4670867919921875, 0.48961639404296875, 0.51214599609375, 0.5346755981445312, 0.5572052001953125, 0.5797348022460938, 0.602264404296875, 0.6247940063476562, 0.6473236083984375, 0.6698532104492188, 0.6923828125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 0.0, 8.0, 9.0, 16.0, 15.0, 22.0, 18.0, 16.0, 24.0, 34.0, 26.0, 44.0, 46.0, 38.0, 59.0, 78.0, 50.0, 59.0, 68.0, 60.0, 46.0, 47.0, 40.0, 28.0, 24.0, 27.0, 16.0, 11.0, 17.0, 3.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0004138946533203125, -0.0004028528928756714, -0.0003918111324310303, -0.00038076937198638916, -0.00036972761154174805, -0.00035868585109710693, -0.0003476440906524658, -0.0003366023302078247, -0.0003255605697631836, -0.0003145188093185425, -0.00030347704887390137, -0.00029243528842926025, -0.00028139352798461914, -0.00027035176753997803, -0.0002593100070953369, -0.0002482682466506958, -0.0002372264862060547, -0.00022618472576141357, -0.00021514296531677246, -0.00020410120487213135, -0.00019305944442749023, -0.00018201768398284912, -0.000170975923538208, -0.0001599341630935669, -0.00014889240264892578, -0.00013785064220428467, -0.00012680888175964355, -0.00011576712131500244, -0.00010472536087036133, -9.368360042572021e-05, -8.26418399810791e-05, -7.160007953643799e-05, -6.0558319091796875e-05, -4.951655864715576e-05, -3.847479820251465e-05, -2.7433037757873535e-05, -1.6391277313232422e-05, -5.349516868591309e-06, 5.692243576049805e-06, 1.6734004020690918e-05, 2.777576446533203e-05, 3.8817524909973145e-05, 4.985928535461426e-05, 6.090104579925537e-05, 7.194280624389648e-05, 8.29845666885376e-05, 9.402632713317871e-05, 0.00010506808757781982, 0.00011610984802246094, 0.00012715160846710205, 0.00013819336891174316, 0.00014923512935638428, 0.0001602768898010254, 0.0001713186502456665, 0.00018236041069030762, 0.00019340217113494873, 0.00020444393157958984, 0.00021548569202423096, 0.00022652745246887207, 0.00023756921291351318, 0.0002486109733581543, 0.0002596527338027954, 0.0002706944942474365, 0.00028173625469207764, 0.00029277801513671875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 8.0, 6.0, 5.0, 11.0, 9.0, 6.0, 9.0, 11.0, 17.0, 42.0, 29.0, 24.0, 45.0, 73.0, 106.0, 161.0, 221.0, 429.0, 1074.0, 89148.0, 953838.0, 1781.0, 619.0, 240.0, 165.0, 104.0, 67.0, 66.0, 49.0, 42.0, 31.0, 20.0, 24.0, 22.0, 13.0, 5.0, 6.0, 7.0, 4.0, 4.0, 6.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006134033203125, -0.005899786949157715, -0.00566554069519043, -0.0054312944412231445, -0.005197048187255859, -0.004962801933288574, -0.004728555679321289, -0.004494309425354004, -0.004260063171386719, -0.004025816917419434, -0.0037915706634521484, -0.0035573244094848633, -0.003323078155517578, -0.003088831901550293, -0.002854585647583008, -0.0026203393936157227, -0.0023860931396484375, -0.0021518468856811523, -0.0019176006317138672, -0.001683354377746582, -0.0014491081237792969, -0.0012148618698120117, -0.0009806156158447266, -0.0007463693618774414, -0.0005121231079101562, -0.0002778768539428711, -4.363059997558594e-05, 0.00019061565399169922, 0.0004248619079589844, 0.0006591081619262695, 0.0008933544158935547, 0.0011276006698608398, 0.001361846923828125, 0.0015960931777954102, 0.0018303394317626953, 0.0020645856857299805, 0.0022988319396972656, 0.0025330781936645508, 0.002767324447631836, 0.003001570701599121, 0.0032358169555664062, 0.0034700632095336914, 0.0037043094635009766, 0.003938555717468262, 0.004172801971435547, 0.004407048225402832, 0.004641294479370117, 0.004875540733337402, 0.0051097869873046875, 0.005344033241271973, 0.005578279495239258, 0.005812525749206543, 0.006046772003173828, 0.006281018257141113, 0.0065152645111083984, 0.006749510765075684, 0.006983757019042969, 0.007218003273010254, 0.007452249526977539, 0.007686495780944824, 0.00792074203491211, 0.008154988288879395, 0.00838923454284668, 0.008623480796813965, 0.00885772705078125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 17.0, 29.0, 46.0, 102.0, 148.0, 166.0, 171.0, 132.0, 95.0, 57.0, 20.0, 8.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002174089604523033, -0.00020824294188059866, -0.00019907692330889404, -0.0001899109047371894, -0.00018074488616548479, -0.00017157886759378016, -0.00016241284902207553, -0.0001532468304503709, -0.00014408081187866628, -0.00013491479330696166, -0.00012574877473525703, -0.0001165827561635524, -0.00010741673759184778, -9.825071902014315e-05, -8.908470044843853e-05, -7.99186818767339e-05, -7.075266330502927e-05, -6.158664473332465e-05, -5.242062616162002e-05, -4.3254607589915395e-05, -3.408858901821077e-05, -2.4922570446506143e-05, -1.5756551874801517e-05, -6.5905333030968904e-06, 2.5754852686077356e-06, 1.1741503840312362e-05, 2.0907522412016988e-05, 3.0073540983721614e-05, 3.923955955542624e-05, 4.8405578127130866e-05, 5.757159669883549e-05, 6.673761527054012e-05, 7.590363384224474e-05, 8.506965241394937e-05, 9.4235670985654e-05, 0.00010340168955735862, 0.00011256770812906325, 0.00012173372670076787, 0.0001308997452724725, 0.00014006576384417713, 0.00014923178241588175, 0.00015839780098758638, 0.000167563819559291, 0.00017672983813099563, 0.00018589585670270026, 0.00019506187527440488, 0.0002042278938461095, 0.00021339391241781414, 0.00022255993098951876, 0.0002317259495612234, 0.00024089196813292801, 0.00025005798670463264, 0.00025922400527633727, 0.0002683900238480419, 0.0002775560424197465, 0.00028672206099145114, 0.00029588807956315577, 0.0003050540981348604, 0.000314220116706565, 0.00032338613527826965, 0.0003325521538499743, 0.0003417181724216789, 0.0003508841909933835, 0.00036005020956508815, 0.0003692162281367928]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 7.0, 12.0, 6.0, 13.0, 11.0, 14.0, 16.0, 15.0, 25.0, 27.0, 35.0, 33.0, 26.0, 47.0, 34.0, 35.0, 45.0, 46.0, 34.0, 40.0, 51.0, 22.0, 39.0, 29.0, 39.0, 37.0, 38.0, 30.0, 26.0, 31.0, 12.0, 18.0, 19.0, 12.0, 8.0, 17.0, 6.0, 3.0, 3.0, 1.0, 5.0, 7.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0001887679100036621, -0.00018302258104085922, -0.00017727725207805634, -0.00017153192311525345, -0.00016578659415245056, -0.00016004126518964767, -0.0001542959362268448, -0.0001485506072640419, -0.00014280527830123901, -0.00013705994933843613, -0.00013131462037563324, -0.00012556929141283035, -0.00011982396245002747, -0.00011407863348722458, -0.00010833330452442169, -0.0001025879755616188, -9.684264659881592e-05, -9.109731763601303e-05, -8.535198867321014e-05, -7.960665971040726e-05, -7.386133074760437e-05, -6.811600178480148e-05, -6.23706728219986e-05, -5.662534385919571e-05, -5.088001489639282e-05, -4.5134685933589935e-05, -3.938935697078705e-05, -3.364402800798416e-05, -2.7898699045181274e-05, -2.2153370082378387e-05, -1.64080411195755e-05, -1.0662712156772614e-05, -4.9173831939697266e-06, 8.279457688331604e-07, 6.573274731636047e-06, 1.2318603694438934e-05, 1.806393265724182e-05, 2.3809261620044708e-05, 2.9554590582847595e-05, 3.529991954565048e-05, 4.104524850845337e-05, 4.6790577471256256e-05, 5.253590643405914e-05, 5.828123539686203e-05, 6.402656435966492e-05, 6.97718933224678e-05, 7.551722228527069e-05, 8.126255124807358e-05, 8.700788021087646e-05, 9.275320917367935e-05, 9.849853813648224e-05, 0.00010424386709928513, 0.00010998919606208801, 0.0001157345250248909, 0.00012147985398769379, 0.00012722518295049667, 0.00013297051191329956, 0.00013871584087610245, 0.00014446116983890533, 0.00015020649880170822, 0.0001559518277645111, 0.000161697156727314, 0.00016744248569011688, 0.00017318781465291977, 0.00017893314361572266]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 10.0, 5.0, 9.0, 7.0, 10.0, 3.0, 20.0, 14.0, 20.0, 20.0, 26.0, 29.0, 21.0, 24.0, 35.0, 35.0, 31.0, 43.0, 35.0, 38.0, 39.0, 36.0, 36.0, 49.0, 48.0, 37.0, 35.0, 30.0, 31.0, 26.0, 28.0, 22.0, 22.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.515625, -3.40960693359375, -3.3035888671875, -3.19757080078125, -3.091552734375, -2.98553466796875, -2.8795166015625, -2.77349853515625, -2.66748046875, -2.56146240234375, -2.4554443359375, -2.34942626953125, -2.243408203125, -2.13739013671875, -2.0313720703125, -1.92535400390625, -1.8193359375, -1.71331787109375, -1.6072998046875, -1.50128173828125, -1.395263671875, -1.28924560546875, -1.1832275390625, -1.07720947265625, -0.97119140625, -0.86517333984375, -0.7591552734375, -0.65313720703125, -0.547119140625, -0.44110107421875, -0.3350830078125, -0.22906494140625, -0.123046875, -0.01702880859375, 0.0889892578125, 0.19500732421875, 0.301025390625, 0.40704345703125, 0.5130615234375, 0.61907958984375, 0.72509765625, 0.83111572265625, 0.9371337890625, 1.04315185546875, 1.149169921875, 1.25518798828125, 1.3612060546875, 1.46722412109375, 1.5732421875, 1.67926025390625, 1.7852783203125, 1.89129638671875, 1.997314453125, 2.10333251953125, 2.2093505859375, 2.31536865234375, 2.42138671875, 2.52740478515625, 2.6334228515625, 2.73944091796875, 2.845458984375, 2.95147705078125, 3.0574951171875, 3.16351318359375, 3.26953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 7.0, 8.0, 12.0, 8.0, 5.0, 11.0, 25.0, 35.0, 37.0, 52.0, 90.0, 152.0, 295.0, 609.0, 1389.0, 3409.0, 8644.0, 21195.0, 52179.0, 136748.0, 326092.0, 300045.0, 118911.0, 46449.0, 18997.0, 7566.0, 3033.0, 1291.0, 569.0, 266.0, 125.0, 89.0, 63.0, 30.0, 25.0, 16.0, 10.0, 20.0, 11.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.86328125, -3.7459716796875, -3.628662109375, -3.5113525390625, -3.39404296875, -3.2767333984375, -3.159423828125, -3.0421142578125, -2.9248046875, -2.8074951171875, -2.690185546875, -2.5728759765625, -2.45556640625, -2.3382568359375, -2.220947265625, -2.1036376953125, -1.986328125, -1.8690185546875, -1.751708984375, -1.6343994140625, -1.51708984375, -1.3997802734375, -1.282470703125, -1.1651611328125, -1.0478515625, -0.9305419921875, -0.813232421875, -0.6959228515625, -0.57861328125, -0.4613037109375, -0.343994140625, -0.2266845703125, -0.109375, 0.0079345703125, 0.125244140625, 0.2425537109375, 0.35986328125, 0.4771728515625, 0.594482421875, 0.7117919921875, 0.8291015625, 0.9464111328125, 1.063720703125, 1.1810302734375, 1.29833984375, 1.4156494140625, 1.532958984375, 1.6502685546875, 1.767578125, 1.8848876953125, 2.002197265625, 2.1195068359375, 2.23681640625, 2.3541259765625, 2.471435546875, 2.5887451171875, 2.7060546875, 2.8233642578125, 2.940673828125, 3.0579833984375, 3.17529296875, 3.2926025390625, 3.409912109375, 3.5272216796875, 3.64453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 3.0, 6.0, 9.0, 8.0, 12.0, 18.0, 11.0, 21.0, 17.0, 13.0, 21.0, 22.0, 46.0, 42.0, 33.0, 59.0, 54.0, 68.0, 162.0, 1378.0, 416.0, 146.0, 80.0, 53.0, 37.0, 43.0, 36.0, 35.0, 27.0, 28.0, 20.0, 20.0, 14.0, 15.0, 12.0, 6.0, 10.0, 12.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.5078125, -11.13623046875, -10.7646484375, -10.39306640625, -10.021484375, -9.64990234375, -9.2783203125, -8.90673828125, -8.53515625, -8.16357421875, -7.7919921875, -7.42041015625, -7.048828125, -6.67724609375, -6.3056640625, -5.93408203125, -5.5625, -5.19091796875, -4.8193359375, -4.44775390625, -4.076171875, -3.70458984375, -3.3330078125, -2.96142578125, -2.58984375, -2.21826171875, -1.8466796875, -1.47509765625, -1.103515625, -0.73193359375, -0.3603515625, 0.01123046875, 0.3828125, 0.75439453125, 1.1259765625, 1.49755859375, 1.869140625, 2.24072265625, 2.6123046875, 2.98388671875, 3.35546875, 3.72705078125, 4.0986328125, 4.47021484375, 4.841796875, 5.21337890625, 5.5849609375, 5.95654296875, 6.328125, 6.69970703125, 7.0712890625, 7.44287109375, 7.814453125, 8.18603515625, 8.5576171875, 8.92919921875, 9.30078125, 9.67236328125, 10.0439453125, 10.41552734375, 10.787109375, 11.15869140625, 11.5302734375, 11.90185546875, 12.2734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 17.0, 22.0, 38.0, 31.0, 50.0, 87.0, 148.0, 267.0, 508.0, 1287.0, 31112.0, 3101959.0, 8069.0, 999.0, 467.0, 202.0, 127.0, 76.0, 57.0, 41.0, 36.0, 19.0, 16.0, 20.0, 5.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53125, -28.3681640625, -27.205078125, -26.0419921875, -24.87890625, -23.7158203125, -22.552734375, -21.3896484375, -20.2265625, -19.0634765625, -17.900390625, -16.7373046875, -15.57421875, -14.4111328125, -13.248046875, -12.0849609375, -10.921875, -9.7587890625, -8.595703125, -7.4326171875, -6.26953125, -5.1064453125, -3.943359375, -2.7802734375, -1.6171875, -0.4541015625, 0.708984375, 1.8720703125, 3.03515625, 4.1982421875, 5.361328125, 6.5244140625, 7.6875, 8.8505859375, 10.013671875, 11.1767578125, 12.33984375, 13.5029296875, 14.666015625, 15.8291015625, 16.9921875, 18.1552734375, 19.318359375, 20.4814453125, 21.64453125, 22.8076171875, 23.970703125, 25.1337890625, 26.296875, 27.4599609375, 28.623046875, 29.7861328125, 30.94921875, 32.1123046875, 33.275390625, 34.4384765625, 35.6015625, 36.7646484375, 37.927734375, 39.0908203125, 40.25390625, 41.4169921875, 42.580078125, 43.7431640625, 44.90625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 77.0, 730.0, 202.0, 6.0, 2.0, 2.0], "bins": [-184.623779296875, -181.52517700195312, -178.42657470703125, -175.32798767089844, -172.22938537597656, -169.1307830810547, -166.03219604492188, -162.93359375, -159.83499145507812, -156.73638916015625, -153.63778686523438, -150.53919982910156, -147.4405975341797, -144.3419952392578, -141.243408203125, -138.14480590820312, -135.04620361328125, -131.94760131835938, -128.8489990234375, -125.75041198730469, -122.65180969238281, -119.55320739746094, -116.4546127319336, -113.35601806640625, -110.25741577148438, -107.1588134765625, -104.06021881103516, -100.96162414550781, -97.86302185058594, -94.76441955566406, -91.66582489013672, -88.56723022460938, -85.46862030029297, -82.37002563476562, -79.27142333984375, -76.17282104492188, -73.07422637939453, -69.97563171386719, -66.87702941894531, -63.7784309387207, -60.679832458496094, -57.581233978271484, -54.482635498046875, -51.384037017822266, -48.285438537597656, -45.18684005737305, -42.08824157714844, -38.98964309692383, -35.89104461669922, -32.79244613647461, -29.69384765625, -26.59524917602539, -23.49665069580078, -20.398052215576172, -17.299453735351562, -14.200855255126953, -11.102258682250977, -8.003660202026367, -4.905061721801758, -1.8064632415771484, 1.292135238647461, 4.39073371887207, 7.48933219909668, 10.587930679321289, 13.686529159545898]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 4.0, 6.0, 12.0, 13.0, 11.0, 9.0, 18.0, 24.0, 29.0, 30.0, 24.0, 37.0, 33.0, 41.0, 44.0, 37.0, 43.0, 44.0, 39.0, 34.0, 45.0, 39.0, 42.0, 36.0, 40.0, 33.0, 32.0, 22.0, 19.0, 18.0, 25.0, 23.0, 9.0, 12.0, 13.0, 9.0, 13.0, 6.0, 5.0, 4.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.117712020874023, -28.188800811767578, -27.2598876953125, -26.330976486206055, -25.40206527709961, -24.47315216064453, -23.544240951538086, -22.61532974243164, -21.686416625976562, -20.757505416870117, -19.82859230041504, -18.899681091308594, -17.97076988220215, -17.04185676574707, -16.112945556640625, -15.184033393859863, -14.255122184753418, -13.326210021972656, -12.397298812866211, -11.46838665008545, -10.539474487304688, -9.610563278198242, -8.68165111541748, -7.752738952636719, -6.823827266693115, -5.894915580749512, -4.96600341796875, -4.0370917320251465, -3.108179807662964, -2.1792678833007812, -1.2503561973571777, -0.321444034576416, 0.6074676513671875, 1.5363795757293701, 2.4652915000915527, 3.3942031860351562, 4.323115348815918, 5.2520270347595215, 6.180938720703125, 7.109850883483887, 8.038763046264648, 8.96767520904541, 9.896586418151855, 10.825498580932617, 11.754410743713379, 12.68332290649414, 13.612234115600586, 14.541146278381348, 15.470057487487793, 16.398969650268555, 17.327880859375, 18.256793975830078, 19.185705184936523, 20.11461639404297, 21.043529510498047, 21.972440719604492, 22.901351928710938, 23.830263137817383, 24.75917625427246, 25.688087463378906, 26.61699867248535, 27.54591178894043, 28.474822998046875, 29.403736114501953, 30.3326473236084]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 4.0, 8.0, 12.0, 13.0, 16.0, 10.0, 29.0, 17.0, 15.0, 25.0, 25.0, 31.0, 26.0, 36.0, 37.0, 27.0, 59.0, 40.0, 49.0, 40.0, 34.0, 34.0, 38.0, 36.0, 31.0, 37.0, 37.0, 36.0, 21.0, 30.0, 22.0, 21.0, 9.0, 14.0, 19.0, 12.0, 6.0, 6.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.990234375, -3.873260498046875, -3.75628662109375, -3.639312744140625, -3.5223388671875, -3.405364990234375, -3.28839111328125, -3.171417236328125, -3.054443359375, -2.937469482421875, -2.82049560546875, -2.703521728515625, -2.5865478515625, -2.469573974609375, -2.35260009765625, -2.235626220703125, -2.11865234375, -2.001678466796875, -1.88470458984375, -1.767730712890625, -1.6507568359375, -1.533782958984375, -1.41680908203125, -1.299835205078125, -1.182861328125, -1.065887451171875, -0.94891357421875, -0.831939697265625, -0.7149658203125, -0.597991943359375, -0.48101806640625, -0.364044189453125, -0.2470703125, -0.130096435546875, -0.01312255859375, 0.103851318359375, 0.2208251953125, 0.337799072265625, 0.45477294921875, 0.571746826171875, 0.688720703125, 0.805694580078125, 0.92266845703125, 1.039642333984375, 1.1566162109375, 1.273590087890625, 1.39056396484375, 1.507537841796875, 1.62451171875, 1.741485595703125, 1.85845947265625, 1.975433349609375, 2.0924072265625, 2.209381103515625, 2.32635498046875, 2.443328857421875, 2.560302734375, 2.677276611328125, 2.79425048828125, 2.911224365234375, 3.0281982421875, 3.145172119140625, 3.26214599609375, 3.379119873046875, 3.49609375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 9.0, 10.0, 9.0, 6.0, 11.0, 15.0, 21.0, 18.0, 17.0, 28.0, 34.0, 56.0, 64.0, 72.0, 107.0, 167.0, 343.0, 1573.0, 69515.0, 2964696.0, 1143881.0, 12046.0, 764.0, 224.0, 151.0, 83.0, 69.0, 68.0, 40.0, 31.0, 23.0, 24.0, 18.0, 17.0, 13.0, 15.0, 8.0, 12.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9375, -12.53076171875, -12.1240234375, -11.71728515625, -11.310546875, -10.90380859375, -10.4970703125, -10.09033203125, -9.68359375, -9.27685546875, -8.8701171875, -8.46337890625, -8.056640625, -7.64990234375, -7.2431640625, -6.83642578125, -6.4296875, -6.02294921875, -5.6162109375, -5.20947265625, -4.802734375, -4.39599609375, -3.9892578125, -3.58251953125, -3.17578125, -2.76904296875, -2.3623046875, -1.95556640625, -1.548828125, -1.14208984375, -0.7353515625, -0.32861328125, 0.078125, 0.48486328125, 0.8916015625, 1.29833984375, 1.705078125, 2.11181640625, 2.5185546875, 2.92529296875, 3.33203125, 3.73876953125, 4.1455078125, 4.55224609375, 4.958984375, 5.36572265625, 5.7724609375, 6.17919921875, 6.5859375, 6.99267578125, 7.3994140625, 7.80615234375, 8.212890625, 8.61962890625, 9.0263671875, 9.43310546875, 9.83984375, 10.24658203125, 10.6533203125, 11.06005859375, 11.466796875, 11.87353515625, 12.2802734375, 12.68701171875, 13.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 27.0, 19.0, 43.0, 71.0, 73.0, 103.0, 210.0, 302.0, 411.0, 574.0, 620.0, 530.0, 374.0, 267.0, 165.0, 100.0, 63.0, 43.0, 24.0, 4.0, 11.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.03125, -11.765625, -11.5, -11.234375, -10.96875, -10.703125, -10.4375, -10.171875, -9.90625, -9.640625, -9.375, -9.109375, -8.84375, -8.578125, -8.3125, -8.046875, -7.78125, -7.515625, -7.25, -6.984375, -6.71875, -6.453125, -6.1875, -5.921875, -5.65625, -5.390625, -5.125, -4.859375, -4.59375, -4.328125, -4.0625, -3.796875, -3.53125, -3.265625, -3.0, -2.734375, -2.46875, -2.203125, -1.9375, -1.671875, -1.40625, -1.140625, -0.875, -0.609375, -0.34375, -0.078125, 0.1875, 0.453125, 0.71875, 0.984375, 1.25, 1.515625, 1.78125, 2.046875, 2.3125, 2.578125, 2.84375, 3.109375, 3.375, 3.640625, 3.90625, 4.171875, 4.4375, 4.703125, 4.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 5.0, 14.0, 8.0, 17.0, 24.0, 46.0, 50.0, 84.0, 139.0, 195.0, 313.0, 500.0, 1223.0, 16487.0, 3858583.0, 312329.0, 2390.0, 707.0, 380.0, 241.0, 160.0, 130.0, 92.0, 55.0, 36.0, 26.0, 18.0, 9.0, 14.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.205078125, -14.34765625, -13.490234375, -12.6328125, -11.775390625, -10.91796875, -10.060546875, -9.203125, -8.345703125, -7.48828125, -6.630859375, -5.7734375, -4.916015625, -4.05859375, -3.201171875, -2.34375, -1.486328125, -0.62890625, 0.228515625, 1.0859375, 1.943359375, 2.80078125, 3.658203125, 4.515625, 5.373046875, 6.23046875, 7.087890625, 7.9453125, 8.802734375, 9.66015625, 10.517578125, 11.375, 12.232421875, 13.08984375, 13.947265625, 14.8046875, 15.662109375, 16.51953125, 17.376953125, 18.234375, 19.091796875, 19.94921875, 20.806640625, 21.6640625, 22.521484375, 23.37890625, 24.236328125, 25.09375, 25.951171875, 26.80859375, 27.666015625, 28.5234375, 29.380859375, 30.23828125, 31.095703125, 31.953125, 32.810546875, 33.66796875, 34.525390625, 35.3828125, 36.240234375, 37.09765625, 37.955078125, 38.8125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 52.0, 519.0, 401.0, 41.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.8626251220703, -188.92396545410156, -184.98529052734375, -181.046630859375, -177.10797119140625, -173.16929626464844, -169.2306365966797, -165.29196166992188, -161.35330200195312, -157.41464233398438, -153.47596740722656, -149.5373077392578, -145.5986328125, -141.65997314453125, -137.7213134765625, -133.7826385498047, -129.84397888183594, -125.90531158447266, -121.96664428710938, -118.02798461914062, -114.08931732177734, -110.15065002441406, -106.21199035644531, -102.27332305908203, -98.33465576171875, -94.39598846435547, -90.45732116699219, -86.51866149902344, -82.57999420166016, -78.64132690429688, -74.70266723632812, -70.76399993896484, -66.8253402709961, -62.88667297363281, -58.9480094909668, -55.00934600830078, -51.0706787109375, -47.13201141357422, -43.1933479309082, -39.25468444824219, -35.316017150878906, -31.377351760864258, -27.43868637084961, -23.50002098083496, -19.561355590820312, -15.622690200805664, -11.684024810791016, -7.745359420776367, -3.8066940307617188, 0.1319713592529297, 4.070636749267578, 8.009302139282227, 11.947967529296875, 15.886632919311523, 19.825298309326172, 23.76396369934082, 27.70262908935547, 31.641294479370117, 35.579959869384766, 39.51862335205078, 43.45729064941406, 47.395957946777344, 51.33462142944336, 55.273284912109375, 59.211952209472656]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 1.0, 7.0, 4.0, 9.0, 11.0, 12.0, 12.0, 12.0, 19.0, 33.0, 35.0, 36.0, 20.0, 42.0, 39.0, 37.0, 41.0, 47.0, 48.0, 34.0, 50.0, 53.0, 39.0, 43.0, 52.0, 29.0, 31.0, 33.0, 18.0, 31.0, 25.0, 15.0, 12.0, 14.0, 9.0, 10.0, 7.0, 9.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-25.860363006591797, -25.138200759887695, -24.416038513183594, -23.693878173828125, -22.971715927124023, -22.249553680419922, -21.52739143371582, -20.80522918701172, -20.08306884765625, -19.36090660095215, -18.638744354248047, -17.916584014892578, -17.194421768188477, -16.472259521484375, -15.750097274780273, -15.027935981750488, -14.305773735046387, -13.583611488342285, -12.8614501953125, -12.139287948608398, -11.417126655578613, -10.694964408874512, -9.972803115844727, -9.250640869140625, -8.528478622436523, -7.80631685256958, -7.084155082702637, -6.361992835998535, -5.63983154296875, -4.917669296264648, -4.195507526397705, -3.4733457565307617, -2.7511844635009766, -2.029022693634033, -1.3068608045578003, -0.5846989154815674, 0.13746285438537598, 0.8596246242523193, 1.5817866325378418, 2.303948402404785, 3.0261101722717285, 3.748271942138672, 4.470433712005615, 5.192595481872559, 5.91475772857666, 6.636919021606445, 7.359081268310547, 8.081243515014648, 8.803404808044434, 9.525567054748535, 10.24772834777832, 10.969890594482422, 11.692051887512207, 12.414214134216309, 13.136375427246094, 13.858537673950195, 14.580699920654297, 15.302862167358398, 16.0250244140625, 16.74718475341797, 17.46934700012207, 18.191509246826172, 18.913671493530273, 19.635833740234375, 20.357994079589844]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 6.0, 13.0, 15.0, 13.0, 17.0, 17.0, 23.0, 38.0, 36.0, 48.0, 49.0, 38.0, 35.0, 53.0, 48.0, 45.0, 37.0, 31.0, 34.0, 35.0, 29.0, 33.0, 41.0, 44.0, 24.0, 30.0, 26.0, 19.0, 19.0, 23.0, 13.0, 8.0, 10.0, 3.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.51171875, -4.388824462890625, -4.26593017578125, -4.143035888671875, -4.0201416015625, -3.897247314453125, -3.77435302734375, -3.651458740234375, -3.528564453125, -3.405670166015625, -3.28277587890625, -3.159881591796875, -3.0369873046875, -2.914093017578125, -2.79119873046875, -2.668304443359375, -2.54541015625, -2.422515869140625, -2.29962158203125, -2.176727294921875, -2.0538330078125, -1.930938720703125, -1.80804443359375, -1.685150146484375, -1.562255859375, -1.439361572265625, -1.31646728515625, -1.193572998046875, -1.0706787109375, -0.947784423828125, -0.82489013671875, -0.701995849609375, -0.5791015625, -0.456207275390625, -0.33331298828125, -0.210418701171875, -0.0875244140625, 0.035369873046875, 0.15826416015625, 0.281158447265625, 0.404052734375, 0.526947021484375, 0.64984130859375, 0.772735595703125, 0.8956298828125, 1.018524169921875, 1.14141845703125, 1.264312744140625, 1.38720703125, 1.510101318359375, 1.63299560546875, 1.755889892578125, 1.8787841796875, 2.001678466796875, 2.12457275390625, 2.247467041015625, 2.370361328125, 2.493255615234375, 2.61614990234375, 2.739044189453125, 2.8619384765625, 2.984832763671875, 3.10772705078125, 3.230621337890625, 3.353515625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 11.0, 16.0, 20.0, 18.0, 31.0, 68.0, 94.0, 124.0, 223.0, 308.0, 491.0, 591.0, 1013.0, 1415.0, 2239.0, 3340.0, 5172.0, 8046.0, 12707.0, 20244.0, 34400.0, 60229.0, 108519.0, 227893.0, 269785.0, 125269.0, 66140.0, 38119.0, 22790.0, 13873.0, 8703.0, 5658.0, 3721.0, 2397.0, 1582.0, 1091.0, 746.0, 491.0, 327.0, 233.0, 118.0, 112.0, 50.0, 55.0, 28.0, 22.0, 22.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7119140625, -0.6904067993164062, -0.6688995361328125, -0.6473922729492188, -0.625885009765625, -0.6043777465820312, -0.5828704833984375, -0.5613632202148438, -0.53985595703125, -0.5183486938476562, -0.4968414306640625, -0.47533416748046875, -0.453826904296875, -0.43231964111328125, -0.4108123779296875, -0.38930511474609375, -0.3677978515625, -0.34629058837890625, -0.3247833251953125, -0.30327606201171875, -0.281768798828125, -0.26026153564453125, -0.2387542724609375, -0.21724700927734375, -0.19573974609375, -0.17423248291015625, -0.1527252197265625, -0.13121795654296875, -0.109710693359375, -0.08820343017578125, -0.0666961669921875, -0.04518890380859375, -0.023681640625, -0.00217437744140625, 0.0193328857421875, 0.04084014892578125, 0.062347412109375, 0.08385467529296875, 0.1053619384765625, 0.12686920166015625, 0.14837646484375, 0.16988372802734375, 0.1913909912109375, 0.21289825439453125, 0.234405517578125, 0.25591278076171875, 0.2774200439453125, 0.29892730712890625, 0.3204345703125, 0.34194183349609375, 0.3634490966796875, 0.38495635986328125, 0.406463623046875, 0.42797088623046875, 0.4494781494140625, 0.47098541259765625, 0.49249267578125, 0.5139999389648438, 0.5355072021484375, 0.5570144653320312, 0.578521728515625, 0.6000289916992188, 0.6215362548828125, 0.6430435180664062, 0.66455078125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 9.0, 6.0, 5.0, 8.0, 10.0, 9.0, 16.0, 12.0, 15.0, 16.0, 32.0, 18.0, 22.0, 27.0, 35.0, 32.0, 36.0, 34.0, 44.0, 37.0, 30.0, 1072.0, 35.0, 37.0, 39.0, 28.0, 38.0, 29.0, 29.0, 32.0, 27.0, 22.0, 20.0, 20.0, 23.0, 18.0, 12.0, 15.0, 18.0, 8.0, 8.0, 10.0, 5.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-2.1328125, -2.067962646484375, -2.00311279296875, -1.938262939453125, -1.8734130859375, -1.808563232421875, -1.74371337890625, -1.678863525390625, -1.614013671875, -1.549163818359375, -1.48431396484375, -1.419464111328125, -1.3546142578125, -1.289764404296875, -1.22491455078125, -1.160064697265625, -1.09521484375, -1.030364990234375, -0.96551513671875, -0.900665283203125, -0.8358154296875, -0.770965576171875, -0.70611572265625, -0.641265869140625, -0.576416015625, -0.511566162109375, -0.44671630859375, -0.381866455078125, -0.3170166015625, -0.252166748046875, -0.18731689453125, -0.122467041015625, -0.0576171875, 0.007232666015625, 0.07208251953125, 0.136932373046875, 0.2017822265625, 0.266632080078125, 0.33148193359375, 0.396331787109375, 0.461181640625, 0.526031494140625, 0.59088134765625, 0.655731201171875, 0.7205810546875, 0.785430908203125, 0.85028076171875, 0.915130615234375, 0.97998046875, 1.044830322265625, 1.10968017578125, 1.174530029296875, 1.2393798828125, 1.304229736328125, 1.36907958984375, 1.433929443359375, 1.498779296875, 1.563629150390625, 1.62847900390625, 1.693328857421875, 1.7581787109375, 1.823028564453125, 1.88787841796875, 1.952728271484375, 2.017578125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 10.0, 29.0, 48.0, 67.0, 69.0, 101.0, 193.0, 261.0, 374.0, 521.0, 735.0, 1092.0, 1587.0, 2173.0, 3001.0, 4478.0, 6365.0, 9204.0, 14080.0, 20772.0, 32225.0, 52201.0, 87497.0, 170813.0, 1333718.0, 143218.0, 77321.0, 46323.0, 29155.0, 18954.0, 12593.0, 8440.0, 5884.0, 4102.0, 2749.0, 2101.0, 1400.0, 980.0, 687.0, 475.0, 373.0, 256.0, 157.0, 102.0, 72.0, 62.0, 34.0, 25.0, 16.0, 7.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.57421875, -0.556488037109375, -0.53875732421875, -0.521026611328125, -0.5032958984375, -0.485565185546875, -0.46783447265625, -0.450103759765625, -0.432373046875, -0.414642333984375, -0.39691162109375, -0.379180908203125, -0.3614501953125, -0.343719482421875, -0.32598876953125, -0.308258056640625, -0.29052734375, -0.272796630859375, -0.25506591796875, -0.237335205078125, -0.2196044921875, -0.201873779296875, -0.18414306640625, -0.166412353515625, -0.148681640625, -0.130950927734375, -0.11322021484375, -0.095489501953125, -0.0777587890625, -0.060028076171875, -0.04229736328125, -0.024566650390625, -0.0068359375, 0.010894775390625, 0.02862548828125, 0.046356201171875, 0.0640869140625, 0.081817626953125, 0.09954833984375, 0.117279052734375, 0.135009765625, 0.152740478515625, 0.17047119140625, 0.188201904296875, 0.2059326171875, 0.223663330078125, 0.24139404296875, 0.259124755859375, 0.27685546875, 0.294586181640625, 0.31231689453125, 0.330047607421875, 0.3477783203125, 0.365509033203125, 0.38323974609375, 0.400970458984375, 0.418701171875, 0.436431884765625, 0.45416259765625, 0.471893310546875, 0.4896240234375, 0.507354736328125, 0.52508544921875, 0.542816162109375, 0.560546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 1.0, 2.0, 5.0, 10.0, 15.0, 18.0, 14.0, 19.0, 13.0, 26.0, 28.0, 33.0, 40.0, 43.0, 50.0, 43.0, 70.0, 66.0, 67.0, 50.0, 41.0, 59.0, 45.0, 57.0, 34.0, 32.0, 17.0, 22.0, 12.0, 10.0, 10.0, 5.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004227161407470703, -0.0004104338586330414, -0.00039815157651901245, -0.0003858692944049835, -0.0003735870122909546, -0.00036130473017692566, -0.00034902244806289673, -0.0003367401659488678, -0.00032445788383483887, -0.00031217560172080994, -0.000299893319606781, -0.0002876110374927521, -0.00027532875537872314, -0.0002630464732646942, -0.0002507641911506653, -0.00023848190903663635, -0.00022619962692260742, -0.0002139173448085785, -0.00020163506269454956, -0.00018935278058052063, -0.0001770704984664917, -0.00016478821635246277, -0.00015250593423843384, -0.0001402236521244049, -0.00012794137001037598, -0.00011565908789634705, -0.00010337680578231812, -9.109452366828918e-05, -7.881224155426025e-05, -6.652995944023132e-05, -5.424767732620239e-05, -4.196539521217346e-05, -2.968311309814453e-05, -1.74008309841156e-05, -5.11854887008667e-06, 7.163733243942261e-06, 1.944601535797119e-05, 3.172829747200012e-05, 4.401057958602905e-05, 5.6292861700057983e-05, 6.857514381408691e-05, 8.085742592811584e-05, 9.313970804214478e-05, 0.0001054219901561737, 0.00011770427227020264, 0.00012998655438423157, 0.0001422688364982605, 0.00015455111861228943, 0.00016683340072631836, 0.0001791156828403473, 0.00019139796495437622, 0.00020368024706840515, 0.00021596252918243408, 0.000228244811296463, 0.00024052709341049194, 0.0002528093755245209, 0.0002650916576385498, 0.00027737393975257874, 0.00028965622186660767, 0.0003019385039806366, 0.00031422078609466553, 0.00032650306820869446, 0.0003387853503227234, 0.0003510676324367523, 0.00036334991455078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 8.0, 8.0, 10.0, 13.0, 12.0, 18.0, 18.0, 22.0, 30.0, 39.0, 63.0, 74.0, 114.0, 179.0, 312.0, 554.0, 2123.0, 1018539.0, 24327.0, 921.0, 378.0, 210.0, 148.0, 88.0, 79.0, 57.0, 36.0, 30.0, 27.0, 28.0, 15.0, 21.0, 13.0, 10.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00717926025390625, -0.0069200992584228516, -0.006660938262939453, -0.006401777267456055, -0.006142616271972656, -0.005883455276489258, -0.005624294281005859, -0.005365133285522461, -0.0051059722900390625, -0.004846811294555664, -0.004587650299072266, -0.004328489303588867, -0.004069328308105469, -0.0038101673126220703, -0.003551006317138672, -0.0032918453216552734, -0.003032684326171875, -0.0027735233306884766, -0.002514362335205078, -0.0022552013397216797, -0.0019960403442382812, -0.0017368793487548828, -0.0014777183532714844, -0.001218557357788086, -0.0009593963623046875, -0.0007002353668212891, -0.0004410743713378906, -0.0001819133758544922, 7.724761962890625e-05, 0.0003364086151123047, 0.0005955696105957031, 0.0008547306060791016, 0.0011138916015625, 0.0013730525970458984, 0.0016322135925292969, 0.0018913745880126953, 0.0021505355834960938, 0.002409696578979492, 0.0026688575744628906, 0.002928018569946289, 0.0031871795654296875, 0.003446340560913086, 0.0037055015563964844, 0.003964662551879883, 0.004223823547363281, 0.00448298454284668, 0.004742145538330078, 0.0050013065338134766, 0.005260467529296875, 0.0055196285247802734, 0.005778789520263672, 0.00603795051574707, 0.006297111511230469, 0.006556272506713867, 0.006815433502197266, 0.007074594497680664, 0.0073337554931640625, 0.007592916488647461, 0.00785207748413086, 0.008111238479614258, 0.008370399475097656, 0.008629560470581055, 0.008888721466064453, 0.009147882461547852, 0.00940704345703125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 51.0, 151.0, 318.0, 270.0, 146.0, 55.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005862560938112438, -0.0005699560279026628, -0.0005536559037864208, -0.0005373557796701789, -0.0005210557137615979, -0.0005047556478530169, -0.0004884555237367749, -0.00047215542872436345, -0.00045585533371195197, -0.0004395552386995405, -0.000423255143687129, -0.00040695504867471755, -0.00039065495366230607, -0.0003743548586498946, -0.0003580547636374831, -0.00034175466862507164, -0.00032545457361266017, -0.0003091544786002487, -0.0002928543835878372, -0.00027655428857542574, -0.00026025419356301427, -0.0002439540985506028, -0.00022765400353819132, -0.00021135390852577984, -0.00019505381351336837, -0.0001787537185009569, -0.00016245362348854542, -0.00014615352847613394, -0.00012985343346372247, -0.00011355333845131099, -9.725324343889952e-05, -8.095314842648804e-05, -6.465302431024611e-05, -4.8352929297834635e-05, -3.205283428542316e-05, -1.5752739273011684e-05, 5.473557393997908e-07, 1.6847450751811266e-05, 3.314754576422274e-05, 4.9447640776634216e-05, 6.574773578904569e-05, 8.204783080145717e-05, 9.834792581386864e-05, 0.00011464802082628012, 0.0001309481158386916, 0.00014724821085110307, 0.00016354830586351454, 0.00017984840087592602, 0.0001961484958883375, 0.00021244859090074897, 0.00022874868591316044, 0.0002450487809255719, 0.0002613488759379834, 0.00027764897095039487, 0.00029394906596280634, 0.0003102491609752178, 0.0003265492559876293, 0.00034284935100004077, 0.00035914944601245224, 0.0003754495410248637, 0.0003917496360372752, 0.00040804973104968667, 0.00042434982606209815, 0.0004406499210745096, 0.0004569500160869211]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 11.0, 11.0, 21.0, 28.0, 19.0, 31.0, 34.0, 44.0, 37.0, 48.0, 45.0, 41.0, 38.0, 50.0, 36.0, 49.0, 51.0, 42.0, 42.0, 54.0, 44.0, 18.0, 21.0, 30.0, 22.0, 23.0, 17.0, 17.0, 12.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025659799575805664, -0.0002493634819984436, -0.00024212896823883057, -0.00023489445447921753, -0.0002276599407196045, -0.00022042542695999146, -0.00021319091320037842, -0.00020595639944076538, -0.00019872188568115234, -0.0001914873719215393, -0.00018425285816192627, -0.00017701834440231323, -0.0001697838306427002, -0.00016254931688308716, -0.00015531480312347412, -0.00014808028936386108, -0.00014084577560424805, -0.000133611261844635, -0.00012637674808502197, -0.00011914223432540894, -0.0001119077205657959, -0.00010467320680618286, -9.743869304656982e-05, -9.020417928695679e-05, -8.296966552734375e-05, -7.573515176773071e-05, -6.850063800811768e-05, -6.126612424850464e-05, -5.40316104888916e-05, -4.6797096729278564e-05, -3.956258296966553e-05, -3.232806921005249e-05, -2.5093555450439453e-05, -1.7859041690826416e-05, -1.0624527931213379e-05, -3.390014171600342e-06, 3.844499588012695e-06, 1.1079013347625732e-05, 1.831352710723877e-05, 2.5548040866851807e-05, 3.2782554626464844e-05, 4.001706838607788e-05, 4.725158214569092e-05, 5.4486095905303955e-05, 6.172060966491699e-05, 6.895512342453003e-05, 7.618963718414307e-05, 8.34241509437561e-05, 9.065866470336914e-05, 9.789317846298218e-05, 0.00010512769222259521, 0.00011236220598220825, 0.00011959671974182129, 0.00012683123350143433, 0.00013406574726104736, 0.0001413002610206604, 0.00014853477478027344, 0.00015576928853988647, 0.0001630038022994995, 0.00017023831605911255, 0.00017747282981872559, 0.00018470734357833862, 0.00019194185733795166, 0.0001991763710975647, 0.00020641088485717773]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 6.0, 13.0, 15.0, 13.0, 17.0, 17.0, 23.0, 38.0, 36.0, 48.0, 49.0, 38.0, 35.0, 53.0, 48.0, 45.0, 37.0, 31.0, 34.0, 35.0, 29.0, 33.0, 41.0, 44.0, 25.0, 29.0, 26.0, 19.0, 19.0, 23.0, 13.0, 8.0, 10.0, 3.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.51171875, -4.388824462890625, -4.26593017578125, -4.143035888671875, -4.0201416015625, -3.897247314453125, -3.77435302734375, -3.651458740234375, -3.528564453125, -3.405670166015625, -3.28277587890625, -3.159881591796875, -3.0369873046875, -2.914093017578125, -2.79119873046875, -2.668304443359375, -2.54541015625, -2.422515869140625, -2.29962158203125, -2.176727294921875, -2.0538330078125, -1.930938720703125, -1.80804443359375, -1.685150146484375, -1.562255859375, -1.439361572265625, -1.31646728515625, -1.193572998046875, -1.0706787109375, -0.947784423828125, -0.82489013671875, -0.701995849609375, -0.5791015625, -0.456207275390625, -0.33331298828125, -0.210418701171875, -0.0875244140625, 0.035369873046875, 0.15826416015625, 0.281158447265625, 0.404052734375, 0.526947021484375, 0.64984130859375, 0.772735595703125, 0.8956298828125, 1.018524169921875, 1.14141845703125, 1.264312744140625, 1.38720703125, 1.510101318359375, 1.63299560546875, 1.755889892578125, 1.8787841796875, 2.001678466796875, 2.12457275390625, 2.247467041015625, 2.370361328125, 2.493255615234375, 2.61614990234375, 2.739044189453125, 2.8619384765625, 2.984832763671875, 3.10772705078125, 3.230621337890625, 3.353515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 8.0, 5.0, 14.0, 13.0, 16.0, 18.0, 22.0, 36.0, 56.0, 60.0, 102.0, 112.0, 166.0, 246.0, 334.0, 644.0, 2070.0, 9036.0, 46324.0, 310888.0, 558504.0, 96448.0, 17400.0, 3628.0, 942.0, 450.0, 278.0, 188.0, 134.0, 94.0, 80.0, 64.0, 34.0, 36.0, 20.0, 21.0, 19.0, 12.0, 12.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-7.9609375, -7.7469482421875, -7.532958984375, -7.3189697265625, -7.10498046875, -6.8909912109375, -6.677001953125, -6.4630126953125, -6.2490234375, -6.0350341796875, -5.821044921875, -5.6070556640625, -5.39306640625, -5.1790771484375, -4.965087890625, -4.7510986328125, -4.537109375, -4.3231201171875, -4.109130859375, -3.8951416015625, -3.68115234375, -3.4671630859375, -3.253173828125, -3.0391845703125, -2.8251953125, -2.6112060546875, -2.397216796875, -2.1832275390625, -1.96923828125, -1.7552490234375, -1.541259765625, -1.3272705078125, -1.11328125, -0.8992919921875, -0.685302734375, -0.4713134765625, -0.25732421875, -0.0433349609375, 0.170654296875, 0.3846435546875, 0.5986328125, 0.8126220703125, 1.026611328125, 1.2406005859375, 1.45458984375, 1.6685791015625, 1.882568359375, 2.0965576171875, 2.310546875, 2.5245361328125, 2.738525390625, 2.9525146484375, 3.16650390625, 3.3804931640625, 3.594482421875, 3.8084716796875, 4.0224609375, 4.2364501953125, 4.450439453125, 4.6644287109375, 4.87841796875, 5.0924072265625, 5.306396484375, 5.5203857421875, 5.734375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 1.0, 12.0, 8.0, 9.0, 16.0, 15.0, 15.0, 13.0, 13.0, 17.0, 21.0, 29.0, 24.0, 34.0, 34.0, 43.0, 47.0, 58.0, 77.0, 211.0, 1548.0, 288.0, 97.0, 75.0, 39.0, 47.0, 28.0, 28.0, 31.0, 30.0, 22.0, 17.0, 14.0, 19.0, 15.0, 12.0, 11.0, 9.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.108154296875, -13.70068359375, -13.293212890625, -12.8857421875, -12.478271484375, -12.07080078125, -11.663330078125, -11.255859375, -10.848388671875, -10.44091796875, -10.033447265625, -9.6259765625, -9.218505859375, -8.81103515625, -8.403564453125, -7.99609375, -7.588623046875, -7.18115234375, -6.773681640625, -6.3662109375, -5.958740234375, -5.55126953125, -5.143798828125, -4.736328125, -4.328857421875, -3.92138671875, -3.513916015625, -3.1064453125, -2.698974609375, -2.29150390625, -1.884033203125, -1.4765625, -1.069091796875, -0.66162109375, -0.254150390625, 0.1533203125, 0.560791015625, 0.96826171875, 1.375732421875, 1.783203125, 2.190673828125, 2.59814453125, 3.005615234375, 3.4130859375, 3.820556640625, 4.22802734375, 4.635498046875, 5.04296875, 5.450439453125, 5.85791015625, 6.265380859375, 6.6728515625, 7.080322265625, 7.48779296875, 7.895263671875, 8.302734375, 8.710205078125, 9.11767578125, 9.525146484375, 9.9326171875, 10.340087890625, 10.74755859375, 11.155029296875, 11.5625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 9.0, 9.0, 12.0, 12.0, 18.0, 22.0, 26.0, 35.0, 48.0, 40.0, 67.0, 90.0, 113.0, 193.0, 319.0, 765.0, 2632.0, 212936.0, 2919316.0, 6657.0, 1047.0, 419.0, 276.0, 161.0, 125.0, 52.0, 56.0, 42.0, 33.0, 28.0, 25.0, 17.0, 23.0, 21.0, 10.0, 6.0, 12.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.3125, -28.37255859375, -27.4326171875, -26.49267578125, -25.552734375, -24.61279296875, -23.6728515625, -22.73291015625, -21.79296875, -20.85302734375, -19.9130859375, -18.97314453125, -18.033203125, -17.09326171875, -16.1533203125, -15.21337890625, -14.2734375, -13.33349609375, -12.3935546875, -11.45361328125, -10.513671875, -9.57373046875, -8.6337890625, -7.69384765625, -6.75390625, -5.81396484375, -4.8740234375, -3.93408203125, -2.994140625, -2.05419921875, -1.1142578125, -0.17431640625, 0.765625, 1.70556640625, 2.6455078125, 3.58544921875, 4.525390625, 5.46533203125, 6.4052734375, 7.34521484375, 8.28515625, 9.22509765625, 10.1650390625, 11.10498046875, 12.044921875, 12.98486328125, 13.9248046875, 14.86474609375, 15.8046875, 16.74462890625, 17.6845703125, 18.62451171875, 19.564453125, 20.50439453125, 21.4443359375, 22.38427734375, 23.32421875, 24.26416015625, 25.2041015625, 26.14404296875, 27.083984375, 28.02392578125, 28.9638671875, 29.90380859375, 30.84375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 39.0, 301.0, 507.0, 144.0, 21.0, 2.0], "bins": [-116.11796569824219, -114.19007873535156, -112.26219177246094, -110.33430480957031, -108.40641784667969, -106.47853088378906, -104.55064392089844, -102.62275695800781, -100.69486999511719, -98.76698303222656, -96.83909606933594, -94.91120910644531, -92.98332214355469, -91.05543518066406, -89.12754821777344, -87.19966125488281, -85.27177429199219, -83.34388732910156, -81.41600036621094, -79.48811340332031, -77.56022644042969, -75.63233947753906, -73.70445251464844, -71.77656555175781, -69.84867858886719, -67.92079162597656, -65.99290466308594, -64.06501770019531, -62.13713073730469, -60.20924377441406, -58.28135681152344, -56.35346984863281, -54.42558288574219, -52.49769592285156, -50.56980895996094, -48.64192199707031, -46.71403503417969, -44.78614807128906, -42.85826110839844, -40.93037414550781, -39.00248718261719, -37.07460021972656, -35.14671325683594, -33.21882629394531, -31.290939331054688, -29.363052368164062, -27.435165405273438, -25.507278442382812, -23.579391479492188, -21.651504516601562, -19.723617553710938, -17.795730590820312, -15.867843627929688, -13.939956665039062, -12.012069702148438, -10.084182739257812, -8.156296730041504, -6.228409767150879, -4.300522804260254, -2.372635841369629, -0.4447488784790039, 1.483138084411621, 3.411025047302246, 5.338912010192871, 7.266798973083496]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 7.0, 6.0, 5.0, 8.0, 8.0, 2.0, 10.0, 6.0, 17.0, 9.0, 18.0, 19.0, 17.0, 22.0, 35.0, 36.0, 26.0, 36.0, 34.0, 19.0, 36.0, 44.0, 48.0, 37.0, 42.0, 37.0, 33.0, 41.0, 32.0, 37.0, 22.0, 30.0, 26.0, 27.0, 13.0, 21.0, 19.0, 17.0, 15.0, 18.0, 11.0, 6.0, 8.0, 11.0, 8.0, 8.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.790145874023438, -24.929243087768555, -24.068342208862305, -23.207439422607422, -22.346538543701172, -21.48563575744629, -20.624732971191406, -19.763832092285156, -18.902929306030273, -18.04202651977539, -17.18112564086914, -16.320222854614258, -15.459321022033691, -14.598419189453125, -13.737516403198242, -12.876614570617676, -12.01571273803711, -11.154810905456543, -10.293909072875977, -9.433006286621094, -8.572104454040527, -7.711202621459961, -6.850300312042236, -5.989398002624512, -5.128496170043945, -4.267594337463379, -3.4066920280456543, -2.545789957046509, -1.6848878860473633, -0.8239860534667969, 0.036916255950927734, 0.8978185653686523, 1.7587223052978516, 2.619624376296997, 3.4805264472961426, 4.341428756713867, 5.202330589294434, 6.063232421875, 6.924134731292725, 7.785037040710449, 8.645938873291016, 9.506840705871582, 10.367742538452148, 11.228645324707031, 12.089547157287598, 12.950448989868164, 13.811351776123047, 14.672253608703613, 15.53315544128418, 16.394058227539062, 17.254959106445312, 18.115861892700195, 18.976764678955078, 19.837665557861328, 20.69856834411621, 21.559471130371094, 22.420372009277344, 23.281274795532227, 24.142175674438477, 25.00307846069336, 25.86397933959961, 26.724882125854492, 27.585784912109375, 28.446685791015625, 29.307588577270508]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 2.0, 10.0, 12.0, 9.0, 13.0, 13.0, 17.0, 21.0, 25.0, 34.0, 46.0, 40.0, 42.0, 43.0, 50.0, 40.0, 41.0, 47.0, 33.0, 44.0, 42.0, 40.0, 28.0, 34.0, 36.0, 33.0, 33.0, 26.0, 37.0, 20.0, 19.0, 8.0, 11.0, 16.0, 4.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.9453125, -4.806671142578125, -4.66802978515625, -4.529388427734375, -4.3907470703125, -4.252105712890625, -4.11346435546875, -3.974822998046875, -3.836181640625, -3.697540283203125, -3.55889892578125, -3.420257568359375, -3.2816162109375, -3.142974853515625, -3.00433349609375, -2.865692138671875, -2.72705078125, -2.588409423828125, -2.44976806640625, -2.311126708984375, -2.1724853515625, -2.033843994140625, -1.89520263671875, -1.756561279296875, -1.617919921875, -1.479278564453125, -1.34063720703125, -1.201995849609375, -1.0633544921875, -0.924713134765625, -0.78607177734375, -0.647430419921875, -0.5087890625, -0.370147705078125, -0.23150634765625, -0.092864990234375, 0.0457763671875, 0.184417724609375, 0.32305908203125, 0.461700439453125, 0.600341796875, 0.738983154296875, 0.87762451171875, 1.016265869140625, 1.1549072265625, 1.293548583984375, 1.43218994140625, 1.570831298828125, 1.70947265625, 1.848114013671875, 1.98675537109375, 2.125396728515625, 2.2640380859375, 2.402679443359375, 2.54132080078125, 2.679962158203125, 2.818603515625, 2.957244873046875, 3.09588623046875, 3.234527587890625, 3.3731689453125, 3.511810302734375, 3.65045166015625, 3.789093017578125, 3.927734375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 6.0, 6.0, 7.0, 9.0, 10.0, 19.0, 13.0, 19.0, 29.0, 27.0, 41.0, 57.0, 82.0, 104.0, 168.0, 432.0, 1369.0, 22604.0, 1271267.0, 2771432.0, 122150.0, 3113.0, 607.0, 236.0, 123.0, 74.0, 52.0, 41.0, 43.0, 29.0, 28.0, 19.0, 21.0, 12.0, 10.0, 9.0, 8.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.490966796875, -11.12255859375, -10.754150390625, -10.3857421875, -10.017333984375, -9.64892578125, -9.280517578125, -8.912109375, -8.543701171875, -8.17529296875, -7.806884765625, -7.4384765625, -7.070068359375, -6.70166015625, -6.333251953125, -5.96484375, -5.596435546875, -5.22802734375, -4.859619140625, -4.4912109375, -4.122802734375, -3.75439453125, -3.385986328125, -3.017578125, -2.649169921875, -2.28076171875, -1.912353515625, -1.5439453125, -1.175537109375, -0.80712890625, -0.438720703125, -0.0703125, 0.298095703125, 0.66650390625, 1.034912109375, 1.4033203125, 1.771728515625, 2.14013671875, 2.508544921875, 2.876953125, 3.245361328125, 3.61376953125, 3.982177734375, 4.3505859375, 4.718994140625, 5.08740234375, 5.455810546875, 5.82421875, 6.192626953125, 6.56103515625, 6.929443359375, 7.2978515625, 7.666259765625, 8.03466796875, 8.403076171875, 8.771484375, 9.139892578125, 9.50830078125, 9.876708984375, 10.2451171875, 10.613525390625, 10.98193359375, 11.350341796875, 11.71875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 8.0, 15.0, 21.0, 32.0, 29.0, 64.0, 85.0, 112.0, 159.0, 239.0, 303.0, 384.0, 504.0, 502.0, 413.0, 350.0, 241.0, 187.0, 132.0, 90.0, 56.0, 37.0, 28.0, 12.0, 15.0, 10.0, 4.0, 8.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.734375, -7.52655029296875, -7.3187255859375, -7.11090087890625, -6.903076171875, -6.69525146484375, -6.4874267578125, -6.27960205078125, -6.07177734375, -5.86395263671875, -5.6561279296875, -5.44830322265625, -5.240478515625, -5.03265380859375, -4.8248291015625, -4.61700439453125, -4.4091796875, -4.20135498046875, -3.9935302734375, -3.78570556640625, -3.577880859375, -3.37005615234375, -3.1622314453125, -2.95440673828125, -2.74658203125, -2.53875732421875, -2.3309326171875, -2.12310791015625, -1.915283203125, -1.70745849609375, -1.4996337890625, -1.29180908203125, -1.083984375, -0.87615966796875, -0.6683349609375, -0.46051025390625, -0.252685546875, -0.04486083984375, 0.1629638671875, 0.37078857421875, 0.57861328125, 0.78643798828125, 0.9942626953125, 1.20208740234375, 1.409912109375, 1.61773681640625, 1.8255615234375, 2.03338623046875, 2.2412109375, 2.44903564453125, 2.6568603515625, 2.86468505859375, 3.072509765625, 3.28033447265625, 3.4881591796875, 3.69598388671875, 3.90380859375, 4.11163330078125, 4.3194580078125, 4.52728271484375, 4.735107421875, 4.94293212890625, 5.1507568359375, 5.35858154296875, 5.56640625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 16.0, 14.0, 27.0, 22.0, 48.0, 63.0, 84.0, 120.0, 119.0, 258.0, 344.0, 598.0, 1553.0, 9364.0, 340108.0, 3670567.0, 161856.0, 6065.0, 1301.0, 557.0, 341.0, 242.0, 158.0, 130.0, 90.0, 53.0, 43.0, 38.0, 26.0, 12.0, 11.0, 13.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5859375, -14.0726318359375, -13.559326171875, -13.0460205078125, -12.53271484375, -12.0194091796875, -11.506103515625, -10.9927978515625, -10.4794921875, -9.9661865234375, -9.452880859375, -8.9395751953125, -8.42626953125, -7.9129638671875, -7.399658203125, -6.8863525390625, -6.373046875, -5.8597412109375, -5.346435546875, -4.8331298828125, -4.31982421875, -3.8065185546875, -3.293212890625, -2.7799072265625, -2.2666015625, -1.7532958984375, -1.239990234375, -0.7266845703125, -0.21337890625, 0.2999267578125, 0.813232421875, 1.3265380859375, 1.83984375, 2.3531494140625, 2.866455078125, 3.3797607421875, 3.89306640625, 4.4063720703125, 4.919677734375, 5.4329833984375, 5.9462890625, 6.4595947265625, 6.972900390625, 7.4862060546875, 7.99951171875, 8.5128173828125, 9.026123046875, 9.5394287109375, 10.052734375, 10.5660400390625, 11.079345703125, 11.5926513671875, 12.10595703125, 12.6192626953125, 13.132568359375, 13.6458740234375, 14.1591796875, 14.6724853515625, 15.185791015625, 15.6990966796875, 16.21240234375, 16.7257080078125, 17.239013671875, 17.7523193359375, 18.265625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 42.0, 150.0, 266.0, 317.0, 159.0, 50.0, 16.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.89935302734375, -65.1007080078125, -63.30207061767578, -61.5034294128418, -59.70478820800781, -57.90614700317383, -56.107505798339844, -54.30886459350586, -52.510223388671875, -50.71158218383789, -48.912940979003906, -47.11429977416992, -45.31565856933594, -43.51701736450195, -41.71837615966797, -39.919734954833984, -38.12109375, -36.322452545166016, -34.52381134033203, -32.72517013549805, -30.926528930664062, -29.127887725830078, -27.329246520996094, -25.53060531616211, -23.73196029663086, -21.933319091796875, -20.13467788696289, -18.336036682128906, -16.537395477294922, -14.738753318786621, -12.940112113952637, -11.141470909118652, -9.342830657958984, -7.544189453125, -5.745548248291016, -3.946906566619873, -2.1482653617858887, -0.3496236801147461, 1.4490175247192383, 3.2476587295532227, 5.046299934387207, 6.844941139221191, 8.643582344055176, 10.442224502563477, 12.240865707397461, 14.039506912231445, 15.83814811706543, 17.636789321899414, 19.4354305267334, 21.234071731567383, 23.032712936401367, 24.83135414123535, 26.629995346069336, 28.428638458251953, 30.227279663085938, 32.02592086791992, 33.824562072753906, 35.62320327758789, 37.421844482421875, 39.22048568725586, 41.019126892089844, 42.81776809692383, 44.61640930175781, 46.4150505065918, 48.21369171142578]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 7.0, 9.0, 14.0, 16.0, 19.0, 29.0, 20.0, 25.0, 20.0, 29.0, 42.0, 32.0, 37.0, 46.0, 41.0, 48.0, 40.0, 40.0, 38.0, 43.0, 39.0, 46.0, 36.0, 28.0, 36.0, 35.0, 33.0, 19.0, 11.0, 19.0, 14.0, 19.0, 14.0, 14.0, 9.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.433757781982422, -21.74953269958496, -21.065309524536133, -20.381084442138672, -19.696861267089844, -19.012636184692383, -18.328411102294922, -17.644187927246094, -16.959962844848633, -16.275737762451172, -15.591514587402344, -14.907289505004883, -14.223065376281738, -13.538841247558594, -12.854616165161133, -12.170392036437988, -11.486167907714844, -10.8019437789917, -10.117719650268555, -9.433494567871094, -8.74927043914795, -8.065046310424805, -7.380821704864502, -6.696597099304199, -6.012372970581055, -5.32814884185791, -4.643924236297607, -3.959699869155884, -3.27547550201416, -2.5912511348724365, -1.907026767730713, -1.2228021621704102, -0.5385780334472656, 0.145646333694458, 0.8298707008361816, 1.5140950679779053, 2.198319435119629, 2.8825438022613525, 3.566768169403076, 4.250992774963379, 4.935216903686523, 5.619441032409668, 6.303665637969971, 6.987890243530273, 7.672114372253418, 8.356338500976562, 9.040563583374023, 9.724787712097168, 10.409011840820312, 11.093235969543457, 11.777460098266602, 12.461685180664062, 13.145909309387207, 13.830133438110352, 14.514358520507812, 15.198582649230957, 15.882806777954102, 16.567031860351562, 17.25125503540039, 17.93548011779785, 18.619705200195312, 19.30392837524414, 19.9881534576416, 20.672378540039062, 21.35660171508789]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 16.0, 17.0, 21.0, 26.0, 19.0, 36.0, 24.0, 33.0, 27.0, 35.0, 40.0, 39.0, 41.0, 38.0, 45.0, 38.0, 53.0, 26.0, 40.0, 29.0, 31.0, 36.0, 36.0, 26.0, 30.0, 22.0, 24.0, 22.0, 13.0, 14.0, 14.0, 12.0, 6.0, 6.0, 6.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.86309814453125, -3.7379150390625, -3.61273193359375, -3.487548828125, -3.36236572265625, -3.2371826171875, -3.11199951171875, -2.98681640625, -2.86163330078125, -2.7364501953125, -2.61126708984375, -2.486083984375, -2.36090087890625, -2.2357177734375, -2.11053466796875, -1.9853515625, -1.86016845703125, -1.7349853515625, -1.60980224609375, -1.484619140625, -1.35943603515625, -1.2342529296875, -1.10906982421875, -0.98388671875, -0.85870361328125, -0.7335205078125, -0.60833740234375, -0.483154296875, -0.35797119140625, -0.2327880859375, -0.10760498046875, 0.017578125, 0.14276123046875, 0.2679443359375, 0.39312744140625, 0.518310546875, 0.64349365234375, 0.7686767578125, 0.89385986328125, 1.01904296875, 1.14422607421875, 1.2694091796875, 1.39459228515625, 1.519775390625, 1.64495849609375, 1.7701416015625, 1.89532470703125, 2.0205078125, 2.14569091796875, 2.2708740234375, 2.39605712890625, 2.521240234375, 2.64642333984375, 2.7716064453125, 2.89678955078125, 3.02197265625, 3.14715576171875, 3.2723388671875, 3.39752197265625, 3.522705078125, 3.64788818359375, 3.7730712890625, 3.89825439453125, 4.0234375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 5.0, 9.0, 22.0, 29.0, 39.0, 71.0, 104.0, 126.0, 232.0, 377.0, 617.0, 989.0, 1568.0, 2436.0, 4054.0, 6472.0, 10800.0, 17945.0, 29946.0, 52393.0, 97591.0, 236002.0, 314240.0, 122082.0, 61900.0, 35485.0, 20680.0, 12501.0, 7597.0, 4594.0, 2875.0, 1751.0, 1125.0, 680.0, 448.0, 261.0, 177.0, 119.0, 65.0, 42.0, 35.0, 19.0, 15.0, 14.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.84619140625, -0.8206634521484375, -0.795135498046875, -0.7696075439453125, -0.74407958984375, -0.7185516357421875, -0.693023681640625, -0.6674957275390625, -0.6419677734375, -0.6164398193359375, -0.590911865234375, -0.5653839111328125, -0.53985595703125, -0.5143280029296875, -0.488800048828125, -0.4632720947265625, -0.437744140625, -0.4122161865234375, -0.386688232421875, -0.3611602783203125, -0.33563232421875, -0.3101043701171875, -0.284576416015625, -0.2590484619140625, -0.2335205078125, -0.2079925537109375, -0.182464599609375, -0.1569366455078125, -0.13140869140625, -0.1058807373046875, -0.080352783203125, -0.0548248291015625, -0.029296875, -0.0037689208984375, 0.021759033203125, 0.0472869873046875, 0.07281494140625, 0.0983428955078125, 0.123870849609375, 0.1493988037109375, 0.1749267578125, 0.2004547119140625, 0.225982666015625, 0.2515106201171875, 0.27703857421875, 0.3025665283203125, 0.328094482421875, 0.3536224365234375, 0.379150390625, 0.4046783447265625, 0.430206298828125, 0.4557342529296875, 0.48126220703125, 0.5067901611328125, 0.532318115234375, 0.5578460693359375, 0.5833740234375, 0.6089019775390625, 0.634429931640625, 0.6599578857421875, 0.68548583984375, 0.7110137939453125, 0.736541748046875, 0.7620697021484375, 0.78759765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 9.0, 7.0, 15.0, 11.0, 9.0, 8.0, 13.0, 15.0, 29.0, 31.0, 14.0, 22.0, 29.0, 24.0, 34.0, 25.0, 28.0, 37.0, 38.0, 28.0, 38.0, 1050.0, 32.0, 39.0, 38.0, 37.0, 31.0, 31.0, 38.0, 26.0, 25.0, 20.0, 24.0, 19.0, 11.0, 23.0, 14.0, 13.0, 15.0, 10.0, 12.0, 10.0, 4.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.0703125, -2.00360107421875, -1.9368896484375, -1.87017822265625, -1.803466796875, -1.73675537109375, -1.6700439453125, -1.60333251953125, -1.53662109375, -1.46990966796875, -1.4031982421875, -1.33648681640625, -1.269775390625, -1.20306396484375, -1.1363525390625, -1.06964111328125, -1.0029296875, -0.93621826171875, -0.8695068359375, -0.80279541015625, -0.736083984375, -0.66937255859375, -0.6026611328125, -0.53594970703125, -0.46923828125, -0.40252685546875, -0.3358154296875, -0.26910400390625, -0.202392578125, -0.13568115234375, -0.0689697265625, -0.00225830078125, 0.064453125, 0.13116455078125, 0.1978759765625, 0.26458740234375, 0.331298828125, 0.39801025390625, 0.4647216796875, 0.53143310546875, 0.59814453125, 0.66485595703125, 0.7315673828125, 0.79827880859375, 0.864990234375, 0.93170166015625, 0.9984130859375, 1.06512451171875, 1.1318359375, 1.19854736328125, 1.2652587890625, 1.33197021484375, 1.398681640625, 1.46539306640625, 1.5321044921875, 1.59881591796875, 1.66552734375, 1.73223876953125, 1.7989501953125, 1.86566162109375, 1.932373046875, 1.99908447265625, 2.0657958984375, 2.13250732421875, 2.19921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 8.0, 11.0, 9.0, 18.0, 39.0, 53.0, 52.0, 103.0, 158.0, 253.0, 330.0, 469.0, 743.0, 1016.0, 1511.0, 2075.0, 3073.0, 4284.0, 6291.0, 9141.0, 13337.0, 19867.0, 30493.0, 47845.0, 78366.0, 142936.0, 1306025.0, 175759.0, 92696.0, 54916.0, 34461.0, 22846.0, 14815.0, 10109.0, 6943.0, 4952.0, 3418.0, 2405.0, 1604.0, 1220.0, 807.0, 516.0, 416.0, 243.0, 163.0, 120.0, 81.0, 53.0, 28.0, 23.0, 16.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.59814453125, -0.5792465209960938, -0.5603485107421875, -0.5414505004882812, -0.522552490234375, -0.5036544799804688, -0.4847564697265625, -0.46585845947265625, -0.44696044921875, -0.42806243896484375, -0.4091644287109375, -0.39026641845703125, -0.371368408203125, -0.35247039794921875, -0.3335723876953125, -0.31467437744140625, -0.2957763671875, -0.27687835693359375, -0.2579803466796875, -0.23908233642578125, -0.220184326171875, -0.20128631591796875, -0.1823883056640625, -0.16349029541015625, -0.14459228515625, -0.12569427490234375, -0.1067962646484375, -0.08789825439453125, -0.069000244140625, -0.05010223388671875, -0.0312042236328125, -0.01230621337890625, 0.006591796875, 0.02548980712890625, 0.0443878173828125, 0.06328582763671875, 0.082183837890625, 0.10108184814453125, 0.1199798583984375, 0.13887786865234375, 0.15777587890625, 0.17667388916015625, 0.1955718994140625, 0.21446990966796875, 0.233367919921875, 0.25226593017578125, 0.2711639404296875, 0.29006195068359375, 0.3089599609375, 0.32785797119140625, 0.3467559814453125, 0.36565399169921875, 0.384552001953125, 0.40345001220703125, 0.4223480224609375, 0.44124603271484375, 0.46014404296875, 0.47904205322265625, 0.4979400634765625, 0.5168380737304688, 0.535736083984375, 0.5546340942382812, 0.5735321044921875, 0.5924301147460938, 0.611328125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 11.0, 12.0, 11.0, 12.0, 10.0, 19.0, 26.0, 25.0, 33.0, 33.0, 37.0, 43.0, 43.0, 45.0, 34.0, 70.0, 40.0, 59.0, 44.0, 54.0, 47.0, 42.0, 41.0, 27.0, 36.0, 19.0, 23.0, 18.0, 9.0, 13.0, 15.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.0004208087921142578, -0.00040893256664276123, -0.00039705634117126465, -0.00038518011569976807, -0.0003733038902282715, -0.0003614276647567749, -0.0003495514392852783, -0.00033767521381378174, -0.00032579898834228516, -0.0003139227628707886, -0.000302046537399292, -0.0002901703119277954, -0.00027829408645629883, -0.00026641786098480225, -0.00025454163551330566, -0.00024266541004180908, -0.0002307891845703125, -0.00021891295909881592, -0.00020703673362731934, -0.00019516050815582275, -0.00018328428268432617, -0.0001714080572128296, -0.000159531831741333, -0.00014765560626983643, -0.00013577938079833984, -0.00012390315532684326, -0.00011202692985534668, -0.0001001507043838501, -8.827447891235352e-05, -7.639825344085693e-05, -6.452202796936035e-05, -5.264580249786377e-05, -4.076957702636719e-05, -2.8893351554870605e-05, -1.7017126083374023e-05, -5.140900611877441e-06, 6.735324859619141e-06, 1.8611550331115723e-05, 3.0487775802612305e-05, 4.236400127410889e-05, 5.424022674560547e-05, 6.611645221710205e-05, 7.799267768859863e-05, 8.986890316009521e-05, 0.0001017451286315918, 0.00011362135410308838, 0.00012549757957458496, 0.00013737380504608154, 0.00014925003051757812, 0.0001611262559890747, 0.0001730024814605713, 0.00018487870693206787, 0.00019675493240356445, 0.00020863115787506104, 0.00022050738334655762, 0.0002323836088180542, 0.0002442598342895508, 0.00025613605976104736, 0.00026801228523254395, 0.00027988851070404053, 0.0002917647361755371, 0.0003036409616470337, 0.0003155171871185303, 0.00032739341259002686, 0.00033926963806152344]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 7.0, 9.0, 11.0, 14.0, 15.0, 21.0, 30.0, 33.0, 42.0, 52.0, 76.0, 91.0, 108.0, 212.0, 310.0, 559.0, 1446.0, 627563.0, 415057.0, 1296.0, 577.0, 299.0, 162.0, 119.0, 96.0, 68.0, 52.0, 48.0, 28.0, 27.0, 21.0, 16.0, 16.0, 18.0, 9.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007129669189453125, -0.006883561611175537, -0.006637454032897949, -0.006391346454620361, -0.0061452388763427734, -0.0058991312980651855, -0.005653023719787598, -0.00540691614151001, -0.005160808563232422, -0.004914700984954834, -0.004668593406677246, -0.004422485828399658, -0.00417637825012207, -0.003930270671844482, -0.0036841630935668945, -0.0034380555152893066, -0.0031919479370117188, -0.002945840358734131, -0.002699732780456543, -0.002453625202178955, -0.002207517623901367, -0.0019614100456237793, -0.0017153024673461914, -0.0014691948890686035, -0.0012230873107910156, -0.0009769797325134277, -0.0007308721542358398, -0.00048476457595825195, -0.00023865699768066406, 7.450580596923828e-06, 0.0002535581588745117, 0.0004996657371520996, 0.0007457733154296875, 0.0009918808937072754, 0.0012379884719848633, 0.0014840960502624512, 0.001730203628540039, 0.001976311206817627, 0.002222418785095215, 0.0024685263633728027, 0.0027146339416503906, 0.0029607415199279785, 0.0032068490982055664, 0.0034529566764831543, 0.003699064254760742, 0.00394517183303833, 0.004191279411315918, 0.004437386989593506, 0.004683494567871094, 0.004929602146148682, 0.0051757097244262695, 0.005421817302703857, 0.005667924880981445, 0.005914032459259033, 0.006160140037536621, 0.006406247615814209, 0.006652355194091797, 0.006898462772369385, 0.007144570350646973, 0.0073906779289245605, 0.0076367855072021484, 0.007882893085479736, 0.008129000663757324, 0.008375108242034912, 0.0086212158203125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 57.0, 706.0, 243.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015413217479363084, -0.0014942148700356483, -0.0014471081085503101, -0.00140000123064965, -0.00135289435274899, -0.00130578747484833, -0.00125868059694767, -0.0012115738354623318, -0.0011644669575616717, -0.0011173600796610117, -0.0010702533181756735, -0.0010231464402750134, -0.0009760395623743534, -0.0009289326844736934, -0.0008818258647806942, -0.0008347190450876951, -0.0007876121671870351, -0.000740505289286375, -0.0006933984695933759, -0.0006462916499003768, -0.0005991847719997168, -0.0005520778940990567, -0.0005049710744060576, -0.000457864225609228, -0.00041075737681239843, -0.00036365052801556885, -0.00031654367921873927, -0.0002694368304219097, -0.0002223299816250801, -0.00017522313282825053, -0.00012811628403142095, -8.100943523459136e-05, -3.390270285308361e-05, 1.320414594374597e-05, 6.031099474057555e-05, 0.00010741784353740513, 0.00015452469233423471, 0.0002016315411310643, 0.0002487383899278939, 0.00029584523872472346, 0.00034295208752155304, 0.0003900589363183826, 0.0004371657851152122, 0.0004842726339120418, 0.0005313794827088714, 0.0005784863606095314, 0.0006255931803025305, 0.0006726999999955297, 0.0007198068778961897, 0.0007669137557968497, 0.0008140205754898489, 0.000861127395182848, 0.000908234273083508, 0.000955341150984168, 0.0010024479124695063, 0.0010495547903701663, 0.0010966616682708263, 0.0011437685461714864, 0.0011908754240721464, 0.0012379821855574846, 0.0012850890634581447, 0.0013321959413588047, 0.001379302702844143, 0.001426409580744803, 0.001473516458645463]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 23.0, 23.0, 23.0, 19.0, 35.0, 35.0, 43.0, 43.0, 32.0, 39.0, 42.0, 37.0, 50.0, 49.0, 28.0, 44.0, 42.0, 45.0, 37.0, 34.0, 36.0, 27.0, 27.0, 25.0, 18.0, 23.0, 17.0, 12.0, 9.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002117156982421875, -0.00020445510745048523, -0.00019719451665878296, -0.0001899339258670807, -0.00018267333507537842, -0.00017541274428367615, -0.00016815215349197388, -0.0001608915627002716, -0.00015363097190856934, -0.00014637038111686707, -0.0001391097903251648, -0.00013184919953346252, -0.00012458860874176025, -0.00011732801795005798, -0.00011006742715835571, -0.00010280683636665344, -9.554624557495117e-05, -8.82856547832489e-05, -8.102506399154663e-05, -7.376447319984436e-05, -6.650388240814209e-05, -5.924329161643982e-05, -5.198270082473755e-05, -4.472211003303528e-05, -3.746151924133301e-05, -3.0200928449630737e-05, -2.2940337657928467e-05, -1.5679746866226196e-05, -8.419156074523926e-06, -1.1585652828216553e-06, 6.102025508880615e-06, 1.3362616300582886e-05, 2.0623207092285156e-05, 2.7883797883987427e-05, 3.51443886756897e-05, 4.240497946739197e-05, 4.966557025909424e-05, 5.692616105079651e-05, 6.418675184249878e-05, 7.144734263420105e-05, 7.870793342590332e-05, 8.596852421760559e-05, 9.322911500930786e-05, 0.00010048970580101013, 0.0001077502965927124, 0.00011501088738441467, 0.00012227147817611694, 0.00012953206896781921, 0.00013679265975952148, 0.00014405325055122375, 0.00015131384134292603, 0.0001585744321346283, 0.00016583502292633057, 0.00017309561371803284, 0.0001803562045097351, 0.00018761679530143738, 0.00019487738609313965, 0.00020213797688484192, 0.0002093985676765442, 0.00021665915846824646, 0.00022391974925994873, 0.000231180340051651, 0.00023844093084335327, 0.00024570152163505554, 0.0002529621124267578]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 16.0, 17.0, 21.0, 26.0, 19.0, 36.0, 24.0, 33.0, 27.0, 35.0, 40.0, 39.0, 41.0, 38.0, 45.0, 38.0, 53.0, 26.0, 40.0, 29.0, 31.0, 36.0, 36.0, 26.0, 30.0, 22.0, 24.0, 22.0, 13.0, 14.0, 14.0, 12.0, 6.0, 6.0, 6.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.86309814453125, -3.7379150390625, -3.61273193359375, -3.487548828125, -3.36236572265625, -3.2371826171875, -3.11199951171875, -2.98681640625, -2.86163330078125, -2.7364501953125, -2.61126708984375, -2.486083984375, -2.36090087890625, -2.2357177734375, -2.11053466796875, -1.9853515625, -1.86016845703125, -1.7349853515625, -1.60980224609375, -1.484619140625, -1.35943603515625, -1.2342529296875, -1.10906982421875, -0.98388671875, -0.85870361328125, -0.7335205078125, -0.60833740234375, -0.483154296875, -0.35797119140625, -0.2327880859375, -0.10760498046875, 0.017578125, 0.14276123046875, 0.2679443359375, 0.39312744140625, 0.518310546875, 0.64349365234375, 0.7686767578125, 0.89385986328125, 1.01904296875, 1.14422607421875, 1.2694091796875, 1.39459228515625, 1.519775390625, 1.64495849609375, 1.7701416015625, 1.89532470703125, 2.0205078125, 2.14569091796875, 2.2708740234375, 2.39605712890625, 2.521240234375, 2.64642333984375, 2.7716064453125, 2.89678955078125, 3.02197265625, 3.14715576171875, 3.2723388671875, 3.39752197265625, 3.522705078125, 3.64788818359375, 3.7730712890625, 3.89825439453125, 4.0234375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 11.0, 9.0, 20.0, 24.0, 39.0, 44.0, 60.0, 91.0, 98.0, 151.0, 219.0, 269.0, 346.0, 485.0, 742.0, 1425.0, 4955.0, 28368.0, 311394.0, 638872.0, 48429.0, 7709.0, 1858.0, 820.0, 544.0, 404.0, 321.0, 221.0, 141.0, 113.0, 100.0, 65.0, 44.0, 37.0, 29.0, 25.0, 19.0, 9.0, 6.0, 2.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7418212890625, -9.428955078125, -9.1160888671875, -8.80322265625, -8.4903564453125, -8.177490234375, -7.8646240234375, -7.5517578125, -7.2388916015625, -6.926025390625, -6.6131591796875, -6.30029296875, -5.9874267578125, -5.674560546875, -5.3616943359375, -5.048828125, -4.7359619140625, -4.423095703125, -4.1102294921875, -3.79736328125, -3.4844970703125, -3.171630859375, -2.8587646484375, -2.5458984375, -2.2330322265625, -1.920166015625, -1.6072998046875, -1.29443359375, -0.9815673828125, -0.668701171875, -0.3558349609375, -0.04296875, 0.2698974609375, 0.582763671875, 0.8956298828125, 1.20849609375, 1.5213623046875, 1.834228515625, 2.1470947265625, 2.4599609375, 2.7728271484375, 3.085693359375, 3.3985595703125, 3.71142578125, 4.0242919921875, 4.337158203125, 4.6500244140625, 4.962890625, 5.2757568359375, 5.588623046875, 5.9014892578125, 6.21435546875, 6.5272216796875, 6.840087890625, 7.1529541015625, 7.4658203125, 7.7786865234375, 8.091552734375, 8.4044189453125, 8.71728515625, 9.0301513671875, 9.343017578125, 9.6558837890625, 9.96875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 11.0, 5.0, 16.0, 16.0, 18.0, 20.0, 32.0, 23.0, 39.0, 30.0, 34.0, 39.0, 59.0, 56.0, 86.0, 180.0, 1621.0, 274.0, 94.0, 74.0, 39.0, 45.0, 39.0, 43.0, 26.0, 27.0, 20.0, 14.0, 13.0, 17.0, 7.0, 11.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.0604248046875, -14.613037109375, -14.1656494140625, -13.71826171875, -13.2708740234375, -12.823486328125, -12.3760986328125, -11.9287109375, -11.4813232421875, -11.033935546875, -10.5865478515625, -10.13916015625, -9.6917724609375, -9.244384765625, -8.7969970703125, -8.349609375, -7.9022216796875, -7.454833984375, -7.0074462890625, -6.56005859375, -6.1126708984375, -5.665283203125, -5.2178955078125, -4.7705078125, -4.3231201171875, -3.875732421875, -3.4283447265625, -2.98095703125, -2.5335693359375, -2.086181640625, -1.6387939453125, -1.19140625, -0.7440185546875, -0.296630859375, 0.1507568359375, 0.59814453125, 1.0455322265625, 1.492919921875, 1.9403076171875, 2.3876953125, 2.8350830078125, 3.282470703125, 3.7298583984375, 4.17724609375, 4.6246337890625, 5.072021484375, 5.5194091796875, 5.966796875, 6.4141845703125, 6.861572265625, 7.3089599609375, 7.75634765625, 8.2037353515625, 8.651123046875, 9.0985107421875, 9.5458984375, 9.9932861328125, 10.440673828125, 10.8880615234375, 11.33544921875, 11.7828369140625, 12.230224609375, 12.6776123046875, 13.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 13.0, 15.0, 10.0, 21.0, 16.0, 21.0, 40.0, 53.0, 49.0, 75.0, 111.0, 193.0, 307.0, 769.0, 3352.0, 1588569.0, 1546780.0, 3514.0, 732.0, 324.0, 209.0, 125.0, 85.0, 58.0, 52.0, 40.0, 25.0, 32.0, 17.0, 10.0, 22.0, 12.0, 11.0, 9.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4375, -33.28955078125, -32.1416015625, -30.99365234375, -29.845703125, -28.69775390625, -27.5498046875, -26.40185546875, -25.25390625, -24.10595703125, -22.9580078125, -21.81005859375, -20.662109375, -19.51416015625, -18.3662109375, -17.21826171875, -16.0703125, -14.92236328125, -13.7744140625, -12.62646484375, -11.478515625, -10.33056640625, -9.1826171875, -8.03466796875, -6.88671875, -5.73876953125, -4.5908203125, -3.44287109375, -2.294921875, -1.14697265625, 0.0009765625, 1.14892578125, 2.296875, 3.44482421875, 4.5927734375, 5.74072265625, 6.888671875, 8.03662109375, 9.1845703125, 10.33251953125, 11.48046875, 12.62841796875, 13.7763671875, 14.92431640625, 16.072265625, 17.22021484375, 18.3681640625, 19.51611328125, 20.6640625, 21.81201171875, 22.9599609375, 24.10791015625, 25.255859375, 26.40380859375, 27.5517578125, 28.69970703125, 29.84765625, 30.99560546875, 32.1435546875, 33.29150390625, 34.439453125, 35.58740234375, 36.7353515625, 37.88330078125, 39.03125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 46.0, 157.0, 291.0, 281.0, 162.0, 50.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.175193786621094, -38.2205810546875, -37.26596450805664, -36.31134796142578, -35.35673522949219, -34.402122497558594, -33.447505950927734, -32.492889404296875, -31.53827667236328, -30.583662033081055, -29.629047393798828, -28.6744327545166, -27.719818115234375, -26.76520347595215, -25.810588836669922, -24.855974197387695, -23.90135955810547, -22.946744918823242, -21.992130279541016, -21.03751564025879, -20.082901000976562, -19.128286361694336, -18.17367172241211, -17.219057083129883, -16.264442443847656, -15.30982780456543, -14.355213165283203, -13.400598526000977, -12.44598388671875, -11.491369247436523, -10.536754608154297, -9.58213996887207, -8.627527236938477, -7.67291259765625, -6.718297958374023, -5.763683319091797, -4.80906867980957, -3.8544540405273438, -2.899839401245117, -1.9452247619628906, -0.9906101226806641, -0.0359954833984375, 0.9186191558837891, 1.8732337951660156, 2.827848434448242, 3.7824630737304688, 4.737077713012695, 5.691692352294922, 6.646306991577148, 7.600921630859375, 8.555536270141602, 9.510150909423828, 10.464765548706055, 11.419380187988281, 12.373994827270508, 13.328609466552734, 14.283224105834961, 15.237838745117188, 16.192453384399414, 17.14706802368164, 18.101682662963867, 19.056297302246094, 20.01091194152832, 20.965526580810547, 21.920141220092773]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 7.0, 4.0, 6.0, 8.0, 15.0, 11.0, 13.0, 14.0, 12.0, 26.0, 15.0, 19.0, 29.0, 26.0, 34.0, 29.0, 38.0, 37.0, 45.0, 34.0, 47.0, 32.0, 40.0, 48.0, 39.0, 34.0, 36.0, 33.0, 35.0, 23.0, 37.0, 17.0, 24.0, 24.0, 14.0, 17.0, 13.0, 15.0, 19.0, 3.0, 4.0, 3.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.897613525390625, -25.985258102416992, -25.07290267944336, -24.16054916381836, -23.248193740844727, -22.335838317871094, -21.42348289489746, -20.511127471923828, -19.598772048950195, -18.686416625976562, -17.77406120300293, -16.861705780029297, -15.94935131072998, -15.036996841430664, -14.124641418457031, -13.212285995483398, -12.299931526184082, -11.38757610321045, -10.475221633911133, -9.5628662109375, -8.650510787963867, -7.738155841827393, -6.825800895690918, -5.913445472717285, -5.0010905265808105, -4.088735580444336, -3.176380157470703, -2.2640252113342285, -1.3516700267791748, -0.4393148422241211, 0.4730401039123535, 1.3853955268859863, 2.297750473022461, 3.2101056575775146, 4.122460842132568, 5.034815788269043, 5.947171211242676, 6.85952615737915, 7.771881103515625, 8.684236526489258, 9.59659194946289, 10.508947372436523, 11.42130184173584, 12.333657264709473, 13.246012687683105, 14.158367156982422, 15.070722579956055, 15.983078002929688, 16.895431518554688, 17.80778694152832, 18.720142364501953, 19.632495880126953, 20.544851303100586, 21.45720672607422, 22.36956214904785, 23.281917572021484, 24.194272994995117, 25.10662841796875, 26.018983840942383, 26.931339263916016, 27.843692779541016, 28.75604820251465, 29.66840362548828, 30.580759048461914, 31.493114471435547]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 10.0, 8.0, 10.0, 11.0, 6.0, 8.0, 26.0, 13.0, 17.0, 24.0, 28.0, 37.0, 31.0, 33.0, 35.0, 40.0, 36.0, 46.0, 43.0, 47.0, 44.0, 48.0, 43.0, 32.0, 40.0, 26.0, 27.0, 35.0, 26.0, 25.0, 29.0, 19.0, 14.0, 17.0, 8.0, 15.0, 12.0, 10.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -3.9979248046875, -3.863037109375, -3.7281494140625, -3.59326171875, -3.4583740234375, -3.323486328125, -3.1885986328125, -3.0537109375, -2.9188232421875, -2.783935546875, -2.6490478515625, -2.51416015625, -2.3792724609375, -2.244384765625, -2.1094970703125, -1.974609375, -1.8397216796875, -1.704833984375, -1.5699462890625, -1.43505859375, -1.3001708984375, -1.165283203125, -1.0303955078125, -0.8955078125, -0.7606201171875, -0.625732421875, -0.4908447265625, -0.35595703125, -0.2210693359375, -0.086181640625, 0.0487060546875, 0.18359375, 0.3184814453125, 0.453369140625, 0.5882568359375, 0.72314453125, 0.8580322265625, 0.992919921875, 1.1278076171875, 1.2626953125, 1.3975830078125, 1.532470703125, 1.6673583984375, 1.80224609375, 1.9371337890625, 2.072021484375, 2.2069091796875, 2.341796875, 2.4766845703125, 2.611572265625, 2.7464599609375, 2.88134765625, 3.0162353515625, 3.151123046875, 3.2860107421875, 3.4208984375, 3.5557861328125, 3.690673828125, 3.8255615234375, 3.96044921875, 4.0953369140625, 4.230224609375, 4.3651123046875, 4.5]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 12.0, 14.0, 23.0, 29.0, 28.0, 35.0, 56.0, 68.0, 87.0, 104.0, 166.0, 212.0, 311.0, 498.0, 1098.0, 5178.0, 79619.0, 1155950.0, 2472550.0, 449604.0, 23942.0, 2449.0, 768.0, 430.0, 261.0, 186.0, 143.0, 86.0, 78.0, 58.0, 62.0, 29.0, 32.0, 24.0, 20.0, 15.0, 9.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.171875, -7.9107666015625, -7.649658203125, -7.3885498046875, -7.12744140625, -6.8663330078125, -6.605224609375, -6.3441162109375, -6.0830078125, -5.8218994140625, -5.560791015625, -5.2996826171875, -5.03857421875, -4.7774658203125, -4.516357421875, -4.2552490234375, -3.994140625, -3.7330322265625, -3.471923828125, -3.2108154296875, -2.94970703125, -2.6885986328125, -2.427490234375, -2.1663818359375, -1.9052734375, -1.6441650390625, -1.383056640625, -1.1219482421875, -0.86083984375, -0.5997314453125, -0.338623046875, -0.0775146484375, 0.18359375, 0.4447021484375, 0.705810546875, 0.9669189453125, 1.22802734375, 1.4891357421875, 1.750244140625, 2.0113525390625, 2.2724609375, 2.5335693359375, 2.794677734375, 3.0557861328125, 3.31689453125, 3.5780029296875, 3.839111328125, 4.1002197265625, 4.361328125, 4.6224365234375, 4.883544921875, 5.1446533203125, 5.40576171875, 5.6668701171875, 5.927978515625, 6.1890869140625, 6.4501953125, 6.7113037109375, 6.972412109375, 7.2335205078125, 7.49462890625, 7.7557373046875, 8.016845703125, 8.2779541015625, 8.5390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 7.0, 5.0, 6.0, 12.0, 12.0, 30.0, 35.0, 47.0, 57.0, 80.0, 111.0, 148.0, 217.0, 273.0, 351.0, 418.0, 436.0, 387.0, 399.0, 281.0, 202.0, 153.0, 106.0, 75.0, 45.0, 48.0, 31.0, 26.0, 22.0, 10.0, 7.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.1016845703125, -5.914306640625, -5.7269287109375, -5.53955078125, -5.3521728515625, -5.164794921875, -4.9774169921875, -4.7900390625, -4.6026611328125, -4.415283203125, -4.2279052734375, -4.04052734375, -3.8531494140625, -3.665771484375, -3.4783935546875, -3.291015625, -3.1036376953125, -2.916259765625, -2.7288818359375, -2.54150390625, -2.3541259765625, -2.166748046875, -1.9793701171875, -1.7919921875, -1.6046142578125, -1.417236328125, -1.2298583984375, -1.04248046875, -0.8551025390625, -0.667724609375, -0.4803466796875, -0.29296875, -0.1055908203125, 0.081787109375, 0.2691650390625, 0.45654296875, 0.6439208984375, 0.831298828125, 1.0186767578125, 1.2060546875, 1.3934326171875, 1.580810546875, 1.7681884765625, 1.95556640625, 2.1429443359375, 2.330322265625, 2.5177001953125, 2.705078125, 2.8924560546875, 3.079833984375, 3.2672119140625, 3.45458984375, 3.6419677734375, 3.829345703125, 4.0167236328125, 4.2041015625, 4.3914794921875, 4.578857421875, 4.7662353515625, 4.95361328125, 5.1409912109375, 5.328369140625, 5.5157470703125, 5.703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 7.0, 7.0, 11.0, 15.0, 20.0, 36.0, 44.0, 64.0, 84.0, 109.0, 175.0, 284.0, 469.0, 784.0, 1983.0, 9690.0, 201338.0, 3544626.0, 414776.0, 14974.0, 2391.0, 880.0, 474.0, 325.0, 190.0, 141.0, 95.0, 83.0, 45.0, 33.0, 30.0, 29.0, 12.0, 10.0, 7.0, 11.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.8046875, -14.3360595703125, -13.867431640625, -13.3988037109375, -12.93017578125, -12.4615478515625, -11.992919921875, -11.5242919921875, -11.0556640625, -10.5870361328125, -10.118408203125, -9.6497802734375, -9.18115234375, -8.7125244140625, -8.243896484375, -7.7752685546875, -7.306640625, -6.8380126953125, -6.369384765625, -5.9007568359375, -5.43212890625, -4.9635009765625, -4.494873046875, -4.0262451171875, -3.5576171875, -3.0889892578125, -2.620361328125, -2.1517333984375, -1.68310546875, -1.2144775390625, -0.745849609375, -0.2772216796875, 0.19140625, 0.6600341796875, 1.128662109375, 1.5972900390625, 2.06591796875, 2.5345458984375, 3.003173828125, 3.4718017578125, 3.9404296875, 4.4090576171875, 4.877685546875, 5.3463134765625, 5.81494140625, 6.2835693359375, 6.752197265625, 7.2208251953125, 7.689453125, 8.1580810546875, 8.626708984375, 9.0953369140625, 9.56396484375, 10.0325927734375, 10.501220703125, 10.9698486328125, 11.4384765625, 11.9071044921875, 12.375732421875, 12.8443603515625, 13.31298828125, 13.7816162109375, 14.250244140625, 14.7188720703125, 15.1875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 298.0, 716.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-725.9168701171875, -710.8220825195312, -695.727294921875, -680.6325073242188, -665.5377197265625, -650.4429321289062, -635.34814453125, -620.2533569335938, -605.1585693359375, -590.0637817382812, -574.968994140625, -559.8742065429688, -544.7794189453125, -529.6846313476562, -514.58984375, -499.49505615234375, -484.4002380371094, -469.3054504394531, -454.2106628417969, -439.1158752441406, -424.0210876464844, -408.9263000488281, -393.83148193359375, -378.7366943359375, -363.64190673828125, -348.547119140625, -333.45233154296875, -318.3575439453125, -303.26275634765625, -288.16796875, -273.07318115234375, -257.9783935546875, -242.88357543945312, -227.78878784179688, -212.69400024414062, -197.59921264648438, -182.50442504882812, -167.40963745117188, -152.31483459472656, -137.2200469970703, -122.12525939941406, -107.03047180175781, -91.93568420410156, -76.84088897705078, -61.74610137939453, -46.65131378173828, -31.5565185546875, -16.46173095703125, -1.366943359375, 13.727846145629883, 28.822635650634766, 43.91742706298828, 59.01221466064453, 74.10700225830078, 89.20179748535156, 104.29658508300781, 119.39137268066406, 134.4861602783203, 149.58094787597656, 164.67575073242188, 179.77053833007812, 194.86532592773438, 209.96011352539062, 225.05490112304688, 240.14968872070312]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 17.0, 11.0, 18.0, 26.0, 29.0, 23.0, 42.0, 37.0, 36.0, 48.0, 56.0, 65.0, 68.0, 62.0, 46.0, 55.0, 56.0, 49.0, 46.0, 34.0, 36.0, 34.0, 26.0, 21.0, 16.0, 13.0, 7.0, 12.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.70359992980957, -19.747283935546875, -18.790969848632812, -17.834653854370117, -16.878337860107422, -15.922021865844727, -14.965706825256348, -14.009391784667969, -13.053075790405273, -12.096759796142578, -11.1404447555542, -10.18412971496582, -9.227813720703125, -8.27149772644043, -7.315182685852051, -6.358867168426514, -5.402551651000977, -4.4462361335754395, -3.4899206161499023, -2.5336050987243652, -1.5772895812988281, -0.620974063873291, 0.3353414535522461, 1.2916569709777832, 2.2479724884033203, 3.2042880058288574, 4.1606035232543945, 5.116919040679932, 6.073234558105469, 7.029550075531006, 7.985865592956543, 8.942180633544922, 9.89849853515625, 10.854814529418945, 11.811129570007324, 12.767444610595703, 13.723760604858398, 14.680076599121094, 15.636391639709473, 16.59270668029785, 17.549022674560547, 18.505338668823242, 19.461654663085938, 20.41796875, 21.374284744262695, 22.33060073852539, 23.286914825439453, 24.24323081970215, 25.199546813964844, 26.15586280822754, 27.112178802490234, 28.068492889404297, 29.024808883666992, 29.981124877929688, 30.93743896484375, 31.893754959106445, 32.85007095336914, 33.8063850402832, 34.76270294189453, 35.719017028808594, 36.675331115722656, 37.631649017333984, 38.58796310424805, 39.544281005859375, 40.50059509277344]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 8.0, 13.0, 13.0, 14.0, 12.0, 17.0, 20.0, 18.0, 20.0, 29.0, 34.0, 47.0, 35.0, 31.0, 39.0, 36.0, 46.0, 40.0, 38.0, 50.0, 54.0, 42.0, 37.0, 30.0, 44.0, 35.0, 23.0, 29.0, 23.0, 21.0, 15.0, 15.0, 14.0, 13.0, 10.0, 6.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.8138427734375, -3.678466796875, -3.5430908203125, -3.40771484375, -3.2723388671875, -3.136962890625, -3.0015869140625, -2.8662109375, -2.7308349609375, -2.595458984375, -2.4600830078125, -2.32470703125, -2.1893310546875, -2.053955078125, -1.9185791015625, -1.783203125, -1.6478271484375, -1.512451171875, -1.3770751953125, -1.24169921875, -1.1063232421875, -0.970947265625, -0.8355712890625, -0.7001953125, -0.5648193359375, -0.429443359375, -0.2940673828125, -0.15869140625, -0.0233154296875, 0.112060546875, 0.2474365234375, 0.3828125, 0.5181884765625, 0.653564453125, 0.7889404296875, 0.92431640625, 1.0596923828125, 1.195068359375, 1.3304443359375, 1.4658203125, 1.6011962890625, 1.736572265625, 1.8719482421875, 2.00732421875, 2.1427001953125, 2.278076171875, 2.4134521484375, 2.548828125, 2.6842041015625, 2.819580078125, 2.9549560546875, 3.09033203125, 3.2257080078125, 3.361083984375, 3.4964599609375, 3.6318359375, 3.7672119140625, 3.902587890625, 4.0379638671875, 4.17333984375, 4.3087158203125, 4.444091796875, 4.5794677734375, 4.71484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 12.0, 8.0, 18.0, 26.0, 35.0, 57.0, 79.0, 114.0, 187.0, 290.0, 414.0, 590.0, 915.0, 1372.0, 2047.0, 3087.0, 4781.0, 7158.0, 11249.0, 17985.0, 29475.0, 49940.0, 89441.0, 179743.0, 298882.0, 154125.0, 79053.0, 44694.0, 26497.0, 16564.0, 10206.0, 6581.0, 4342.0, 2820.0, 1944.0, 1249.0, 832.0, 593.0, 375.0, 227.0, 180.0, 120.0, 75.0, 49.0, 39.0, 29.0, 19.0, 11.0, 9.0, 7.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.82958984375, -0.8054733276367188, -0.7813568115234375, -0.7572402954101562, -0.733123779296875, -0.7090072631835938, -0.6848907470703125, -0.6607742309570312, -0.63665771484375, -0.6125411987304688, -0.5884246826171875, -0.5643081665039062, -0.540191650390625, -0.5160751342773438, -0.4919586181640625, -0.46784210205078125, -0.4437255859375, -0.41960906982421875, -0.3954925537109375, -0.37137603759765625, -0.347259521484375, -0.32314300537109375, -0.2990264892578125, -0.27490997314453125, -0.25079345703125, -0.22667694091796875, -0.2025604248046875, -0.17844390869140625, -0.154327392578125, -0.13021087646484375, -0.1060943603515625, -0.08197784423828125, -0.057861328125, -0.03374481201171875, -0.0096282958984375, 0.01448822021484375, 0.038604736328125, 0.06272125244140625, 0.0868377685546875, 0.11095428466796875, 0.13507080078125, 0.15918731689453125, 0.1833038330078125, 0.20742034912109375, 0.231536865234375, 0.25565338134765625, 0.2797698974609375, 0.30388641357421875, 0.3280029296875, 0.35211944580078125, 0.3762359619140625, 0.40035247802734375, 0.424468994140625, 0.44858551025390625, 0.4727020263671875, 0.49681854248046875, 0.52093505859375, 0.5450515747070312, 0.5691680908203125, 0.5932846069335938, 0.617401123046875, 0.6415176391601562, 0.6656341552734375, 0.6897506713867188, 0.7138671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 6.0, 4.0, 13.0, 12.0, 14.0, 14.0, 6.0, 19.0, 14.0, 18.0, 32.0, 31.0, 28.0, 29.0, 44.0, 41.0, 28.0, 35.0, 41.0, 36.0, 1060.0, 51.0, 43.0, 38.0, 36.0, 34.0, 35.0, 37.0, 25.0, 32.0, 22.0, 14.0, 13.0, 15.0, 13.0, 13.0, 11.0, 17.0, 7.0, 7.0, 8.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.455078125, -2.374176025390625, -2.29327392578125, -2.212371826171875, -2.1314697265625, -2.050567626953125, -1.96966552734375, -1.888763427734375, -1.807861328125, -1.726959228515625, -1.64605712890625, -1.565155029296875, -1.4842529296875, -1.403350830078125, -1.32244873046875, -1.241546630859375, -1.16064453125, -1.079742431640625, -0.99884033203125, -0.917938232421875, -0.8370361328125, -0.756134033203125, -0.67523193359375, -0.594329833984375, -0.513427734375, -0.432525634765625, -0.35162353515625, -0.270721435546875, -0.1898193359375, -0.108917236328125, -0.02801513671875, 0.052886962890625, 0.1337890625, 0.214691162109375, 0.29559326171875, 0.376495361328125, 0.4573974609375, 0.538299560546875, 0.61920166015625, 0.700103759765625, 0.781005859375, 0.861907958984375, 0.94281005859375, 1.023712158203125, 1.1046142578125, 1.185516357421875, 1.26641845703125, 1.347320556640625, 1.42822265625, 1.509124755859375, 1.59002685546875, 1.670928955078125, 1.7518310546875, 1.832733154296875, 1.91363525390625, 1.994537353515625, 2.075439453125, 2.156341552734375, 2.23724365234375, 2.318145751953125, 2.3990478515625, 2.479949951171875, 2.56085205078125, 2.641754150390625, 2.72265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 8.0, 6.0, 13.0, 16.0, 32.0, 45.0, 56.0, 91.0, 125.0, 195.0, 281.0, 416.0, 547.0, 822.0, 1167.0, 1771.0, 2484.0, 3607.0, 5179.0, 7815.0, 11739.0, 18111.0, 28713.0, 47456.0, 83202.0, 159637.0, 1352769.0, 158230.0, 82793.0, 46882.0, 28580.0, 18002.0, 11600.0, 7689.0, 5158.0, 3730.0, 2492.0, 1848.0, 1242.0, 805.0, 566.0, 424.0, 255.0, 196.0, 119.0, 69.0, 54.0, 48.0, 18.0, 11.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68701171875, -0.6644821166992188, -0.6419525146484375, -0.6194229125976562, -0.596893310546875, -0.5743637084960938, -0.5518341064453125, -0.5293045043945312, -0.50677490234375, -0.48424530029296875, -0.4617156982421875, -0.43918609619140625, -0.416656494140625, -0.39412689208984375, -0.3715972900390625, -0.34906768798828125, -0.3265380859375, -0.30400848388671875, -0.2814788818359375, -0.25894927978515625, -0.236419677734375, -0.21389007568359375, -0.1913604736328125, -0.16883087158203125, -0.14630126953125, -0.12377166748046875, -0.1012420654296875, -0.07871246337890625, -0.056182861328125, -0.03365325927734375, -0.0111236572265625, 0.01140594482421875, 0.033935546875, 0.05646514892578125, 0.0789947509765625, 0.10152435302734375, 0.124053955078125, 0.14658355712890625, 0.1691131591796875, 0.19164276123046875, 0.21417236328125, 0.23670196533203125, 0.2592315673828125, 0.28176116943359375, 0.304290771484375, 0.32682037353515625, 0.3493499755859375, 0.37187957763671875, 0.3944091796875, 0.41693878173828125, 0.4394683837890625, 0.46199798583984375, 0.484527587890625, 0.5070571899414062, 0.5295867919921875, 0.5521163940429688, 0.57464599609375, 0.5971755981445312, 0.6197052001953125, 0.6422348022460938, 0.664764404296875, 0.6872940063476562, 0.7098236083984375, 0.7323532104492188, 0.7548828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 12.0, 10.0, 9.0, 10.0, 12.0, 15.0, 18.0, 16.0, 31.0, 22.0, 32.0, 29.0, 33.0, 46.0, 44.0, 52.0, 48.0, 52.0, 54.0, 52.0, 39.0, 49.0, 38.0, 35.0, 35.0, 35.0, 18.0, 26.0, 25.0, 11.0, 17.0, 7.0, 17.0, 4.0, 6.0, 9.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00043773651123046875, -0.0004251226782798767, -0.00041250884532928467, -0.0003998950123786926, -0.0003872811794281006, -0.00037466734647750854, -0.0003620535135269165, -0.00034943968057632446, -0.0003368258476257324, -0.0003242120146751404, -0.00031159818172454834, -0.0002989843487739563, -0.00028637051582336426, -0.0002737566828727722, -0.0002611428499221802, -0.00024852901697158813, -0.0002359151840209961, -0.00022330135107040405, -0.000210687518119812, -0.00019807368516921997, -0.00018545985221862793, -0.0001728460192680359, -0.00016023218631744385, -0.0001476183533668518, -0.00013500452041625977, -0.00012239068746566772, -0.00010977685451507568, -9.716302156448364e-05, -8.45491886138916e-05, -7.193535566329956e-05, -5.932152271270752e-05, -4.670768976211548e-05, -3.409385681152344e-05, -2.1480023860931396e-05, -8.866190910339355e-06, 3.7476420402526855e-06, 1.6361474990844727e-05, 2.8975307941436768e-05, 4.158914089202881e-05, 5.420297384262085e-05, 6.681680679321289e-05, 7.943063974380493e-05, 9.204447269439697e-05, 0.00010465830564498901, 0.00011727213859558105, 0.0001298859715461731, 0.00014249980449676514, 0.00015511363744735718, 0.00016772747039794922, 0.00018034130334854126, 0.0001929551362991333, 0.00020556896924972534, 0.00021818280220031738, 0.00023079663515090942, 0.00024341046810150146, 0.0002560243010520935, 0.00026863813400268555, 0.0002812519669532776, 0.00029386579990386963, 0.00030647963285446167, 0.0003190934658050537, 0.00033170729875564575, 0.0003443211317062378, 0.00035693496465682983, 0.0003695487976074219]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 12.0, 14.0, 8.0, 8.0, 23.0, 23.0, 27.0, 27.0, 36.0, 39.0, 55.0, 73.0, 84.0, 131.0, 179.0, 228.0, 418.0, 700.0, 2545.0, 970600.0, 70479.0, 1149.0, 527.0, 342.0, 193.0, 138.0, 94.0, 71.0, 60.0, 48.0, 36.0, 40.0, 25.0, 29.0, 17.0, 21.0, 9.0, 4.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.007114410400390625, -0.006867110729217529, -0.006619811058044434, -0.006372511386871338, -0.006125211715698242, -0.0058779120445251465, -0.005630612373352051, -0.005383312702178955, -0.005136013031005859, -0.004888713359832764, -0.004641413688659668, -0.004394114017486572, -0.0041468143463134766, -0.003899514675140381, -0.003652215003967285, -0.0034049153327941895, -0.0031576156616210938, -0.002910315990447998, -0.0026630163192749023, -0.0024157166481018066, -0.002168416976928711, -0.0019211173057556152, -0.0016738176345825195, -0.0014265179634094238, -0.0011792182922363281, -0.0009319186210632324, -0.0006846189498901367, -0.000437319278717041, -0.0001900196075439453, 5.728006362915039e-05, 0.0003045797348022461, 0.0005518794059753418, 0.0007991790771484375, 0.0010464787483215332, 0.001293778419494629, 0.0015410780906677246, 0.0017883777618408203, 0.002035677433013916, 0.0022829771041870117, 0.0025302767753601074, 0.002777576446533203, 0.003024876117706299, 0.0032721757888793945, 0.0035194754600524902, 0.003766775131225586, 0.004014074802398682, 0.004261374473571777, 0.004508674144744873, 0.004755973815917969, 0.0050032734870910645, 0.00525057315826416, 0.005497872829437256, 0.0057451725006103516, 0.005992472171783447, 0.006239771842956543, 0.006487071514129639, 0.006734371185302734, 0.00698167085647583, 0.007228970527648926, 0.0074762701988220215, 0.007723569869995117, 0.007970869541168213, 0.008218169212341309, 0.008465468883514404, 0.0087127685546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 31.0, 435.0, 511.0, 37.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.002659361809492111, -0.002613550052046776, -0.002567738527432084, -0.0025219267699867487, -0.002476115245372057, -0.0024303034879267216, -0.00238449196331203, -0.0023386802058666945, -0.0022928686812520027, -0.0022470569238066673, -0.0022012453991919756, -0.00215543364174664, -0.0021096221171319485, -0.002063810359686613, -0.0020179988350719213, -0.001972187077626586, -0.0019263753201812506, -0.001880563679151237, -0.0018347520381212234, -0.0017889403970912099, -0.0017431287560611963, -0.001697316998615861, -0.0016515054740011692, -0.0016056937165558338, -0.001559882191941142, -0.0015140705509111285, -0.001468258909881115, -0.0014224472688511014, -0.0013766356278210878, -0.0013308238703757524, -0.0012850123457610607, -0.0012392005883157253, -0.00119338883087039, -0.0011475771898403764, -0.0011017655488103628, -0.0010559539077803493, -0.0010101422667503357, -0.0009643305675126612, -0.0009185189264826477, -0.0008727072272449732, -0.0008268957026302814, -0.0007810840616002679, -0.0007352724205702543, -0.0006894607795402408, -0.0006436490803025663, -0.0005978374392725527, -0.0005520257982425392, -0.0005062140990048647, -0.00046040245797485113, -0.00041459081694483757, -0.00036877914681099355, -0.00032296750578098, -0.000277155835647136, -0.0002313441946171224, -0.00018553255358710885, -0.00013972088345326483, -9.390924242325127e-05, -4.809759047930129e-05, -2.285938535351306e-06, 4.352570977061987e-05, 8.933736535254866e-05, 0.00013514902093447745, 0.000180960661964491, 0.00022677233209833503, 0.0002725839731283486]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 11.0, 7.0, 5.0, 17.0, 22.0, 16.0, 25.0, 16.0, 23.0, 24.0, 37.0, 33.0, 33.0, 41.0, 61.0, 36.0, 37.0, 51.0, 38.0, 50.0, 54.0, 48.0, 34.0, 32.0, 28.0, 35.0, 31.0, 23.0, 15.0, 22.0, 15.0, 14.0, 9.0, 7.0, 7.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022673606872558594, -0.00021886080503463745, -0.00021098554134368896, -0.00020311027765274048, -0.000195235013961792, -0.0001873597502708435, -0.00017948448657989502, -0.00017160922288894653, -0.00016373395919799805, -0.00015585869550704956, -0.00014798343181610107, -0.0001401081681251526, -0.0001322329044342041, -0.00012435764074325562, -0.00011648237705230713, -0.00010860711336135864, -0.00010073184967041016, -9.285658597946167e-05, -8.498132228851318e-05, -7.71060585975647e-05, -6.923079490661621e-05, -6.135553121566772e-05, -5.348026752471924e-05, -4.560500383377075e-05, -3.7729740142822266e-05, -2.985447645187378e-05, -2.1979212760925293e-05, -1.4103949069976807e-05, -6.22868537902832e-06, 1.646578311920166e-06, 9.521842002868652e-06, 1.739710569381714e-05, 2.5272369384765625e-05, 3.314763307571411e-05, 4.10228967666626e-05, 4.8898160457611084e-05, 5.677342414855957e-05, 6.464868783950806e-05, 7.252395153045654e-05, 8.039921522140503e-05, 8.827447891235352e-05, 9.6149742603302e-05, 0.00010402500629425049, 0.00011190026998519897, 0.00011977553367614746, 0.00012765079736709595, 0.00013552606105804443, 0.00014340132474899292, 0.0001512765884399414, 0.0001591518521308899, 0.00016702711582183838, 0.00017490237951278687, 0.00018277764320373535, 0.00019065290689468384, 0.00019852817058563232, 0.0002064034342765808, 0.0002142786979675293, 0.00022215396165847778, 0.00023002922534942627, 0.00023790448904037476, 0.00024577975273132324, 0.00025365501642227173, 0.0002615302801132202, 0.0002694055438041687, 0.0002772808074951172]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 8.0, 13.0, 13.0, 14.0, 12.0, 17.0, 20.0, 18.0, 20.0, 29.0, 34.0, 47.0, 35.0, 31.0, 39.0, 36.0, 46.0, 40.0, 38.0, 50.0, 54.0, 42.0, 37.0, 30.0, 43.0, 36.0, 23.0, 29.0, 23.0, 21.0, 15.0, 15.0, 14.0, 13.0, 10.0, 6.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.8138427734375, -3.678466796875, -3.5430908203125, -3.40771484375, -3.2723388671875, -3.136962890625, -3.0015869140625, -2.8662109375, -2.7308349609375, -2.595458984375, -2.4600830078125, -2.32470703125, -2.1893310546875, -2.053955078125, -1.9185791015625, -1.783203125, -1.6478271484375, -1.512451171875, -1.3770751953125, -1.24169921875, -1.1063232421875, -0.970947265625, -0.8355712890625, -0.7001953125, -0.5648193359375, -0.429443359375, -0.2940673828125, -0.15869140625, -0.0233154296875, 0.112060546875, 0.2474365234375, 0.3828125, 0.5181884765625, 0.653564453125, 0.7889404296875, 0.92431640625, 1.0596923828125, 1.195068359375, 1.3304443359375, 1.4658203125, 1.6011962890625, 1.736572265625, 1.8719482421875, 2.00732421875, 2.1427001953125, 2.278076171875, 2.4134521484375, 2.548828125, 2.6842041015625, 2.819580078125, 2.9549560546875, 3.09033203125, 3.2257080078125, 3.361083984375, 3.4964599609375, 3.6318359375, 3.7672119140625, 3.902587890625, 4.0379638671875, 4.17333984375, 4.3087158203125, 4.444091796875, 4.5794677734375, 4.71484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 15.0, 10.0, 15.0, 23.0, 48.0, 40.0, 57.0, 75.0, 99.0, 120.0, 169.0, 290.0, 421.0, 893.0, 1683.0, 3709.0, 9712.0, 28017.0, 83446.0, 264314.0, 415483.0, 159047.0, 51508.0, 17206.0, 6406.0, 2625.0, 1260.0, 609.0, 389.0, 225.0, 174.0, 103.0, 91.0, 60.0, 52.0, 40.0, 27.0, 29.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.48406982421875, -4.3197021484375, -4.15533447265625, -3.990966796875, -3.82659912109375, -3.6622314453125, -3.49786376953125, -3.33349609375, -3.16912841796875, -3.0047607421875, -2.84039306640625, -2.676025390625, -2.51165771484375, -2.3472900390625, -2.18292236328125, -2.0185546875, -1.85418701171875, -1.6898193359375, -1.52545166015625, -1.361083984375, -1.19671630859375, -1.0323486328125, -0.86798095703125, -0.70361328125, -0.53924560546875, -0.3748779296875, -0.21051025390625, -0.046142578125, 0.11822509765625, 0.2825927734375, 0.44696044921875, 0.611328125, 0.77569580078125, 0.9400634765625, 1.10443115234375, 1.268798828125, 1.43316650390625, 1.5975341796875, 1.76190185546875, 1.92626953125, 2.09063720703125, 2.2550048828125, 2.41937255859375, 2.583740234375, 2.74810791015625, 2.9124755859375, 3.07684326171875, 3.2412109375, 3.40557861328125, 3.5699462890625, 3.73431396484375, 3.898681640625, 4.06304931640625, 4.2274169921875, 4.39178466796875, 4.55615234375, 4.72052001953125, 4.8848876953125, 5.04925537109375, 5.213623046875, 5.37799072265625, 5.5423583984375, 5.70672607421875, 5.87109375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 6.0, 6.0, 16.0, 23.0, 13.0, 20.0, 15.0, 26.0, 30.0, 31.0, 35.0, 30.0, 41.0, 43.0, 71.0, 105.0, 254.0, 1463.0, 230.0, 125.0, 82.0, 55.0, 45.0, 29.0, 32.0, 24.0, 32.0, 28.0, 22.0, 19.0, 19.0, 7.0, 6.0, 9.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-13.9453125, -13.552490234375, -13.15966796875, -12.766845703125, -12.3740234375, -11.981201171875, -11.58837890625, -11.195556640625, -10.802734375, -10.409912109375, -10.01708984375, -9.624267578125, -9.2314453125, -8.838623046875, -8.44580078125, -8.052978515625, -7.66015625, -7.267333984375, -6.87451171875, -6.481689453125, -6.0888671875, -5.696044921875, -5.30322265625, -4.910400390625, -4.517578125, -4.124755859375, -3.73193359375, -3.339111328125, -2.9462890625, -2.553466796875, -2.16064453125, -1.767822265625, -1.375, -0.982177734375, -0.58935546875, -0.196533203125, 0.1962890625, 0.589111328125, 0.98193359375, 1.374755859375, 1.767578125, 2.160400390625, 2.55322265625, 2.946044921875, 3.3388671875, 3.731689453125, 4.12451171875, 4.517333984375, 4.91015625, 5.302978515625, 5.69580078125, 6.088623046875, 6.4814453125, 6.874267578125, 7.26708984375, 7.659912109375, 8.052734375, 8.445556640625, 8.83837890625, 9.231201171875, 9.6240234375, 10.016845703125, 10.40966796875, 10.802490234375, 11.1953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 7.0, 4.0, 12.0, 10.0, 13.0, 21.0, 22.0, 44.0, 56.0, 67.0, 101.0, 145.0, 240.0, 353.0, 608.0, 1188.0, 9514.0, 2306540.0, 818212.0, 5825.0, 1095.0, 563.0, 341.0, 223.0, 134.0, 91.0, 68.0, 60.0, 27.0, 22.0, 13.0, 15.0, 18.0, 6.0, 7.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.765625, -23.989990234375, -23.21435546875, -22.438720703125, -21.6630859375, -20.887451171875, -20.11181640625, -19.336181640625, -18.560546875, -17.784912109375, -17.00927734375, -16.233642578125, -15.4580078125, -14.682373046875, -13.90673828125, -13.131103515625, -12.35546875, -11.579833984375, -10.80419921875, -10.028564453125, -9.2529296875, -8.477294921875, -7.70166015625, -6.926025390625, -6.150390625, -5.374755859375, -4.59912109375, -3.823486328125, -3.0478515625, -2.272216796875, -1.49658203125, -0.720947265625, 0.0546875, 0.830322265625, 1.60595703125, 2.381591796875, 3.1572265625, 3.932861328125, 4.70849609375, 5.484130859375, 6.259765625, 7.035400390625, 7.81103515625, 8.586669921875, 9.3623046875, 10.137939453125, 10.91357421875, 11.689208984375, 12.46484375, 13.240478515625, 14.01611328125, 14.791748046875, 15.5673828125, 16.343017578125, 17.11865234375, 17.894287109375, 18.669921875, 19.445556640625, 20.22119140625, 20.996826171875, 21.7724609375, 22.548095703125, 23.32373046875, 24.099365234375, 24.875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 680.0, 331.0, 0.0, 0.0, 1.0], "bins": [-405.9640197753906, -399.18408203125, -392.4041442871094, -385.62420654296875, -378.84423828125, -372.0643005371094, -365.28436279296875, -358.5044250488281, -351.7244873046875, -344.9445495605469, -338.16461181640625, -331.3846435546875, -324.6047058105469, -317.82476806640625, -311.0448303222656, -304.264892578125, -297.48492431640625, -290.7049865722656, -283.925048828125, -277.14508056640625, -270.3651428222656, -263.585205078125, -256.8052673339844, -250.02532958984375, -243.24539184570312, -236.4654541015625, -229.6855010986328, -222.9055633544922, -216.12562561035156, -209.34567260742188, -202.56573486328125, -195.78579711914062, -189.005859375, -182.22592163085938, -175.4459686279297, -168.66603088378906, -161.88609313964844, -155.10614013671875, -148.32620239257812, -141.5462646484375, -134.7663116455078, -127.98636627197266, -121.20642852783203, -114.42648315429688, -107.64654541015625, -100.8666000366211, -94.08665466308594, -87.30671691894531, -80.52677154541016, -73.746826171875, -66.96688842773438, -60.18694305419922, -53.40700149536133, -46.62705993652344, -39.84711456298828, -33.06717300415039, -26.287233352661133, -19.50728988647461, -12.727348327636719, -5.947404861450195, 0.8325366973876953, 7.612478256225586, 14.392423629760742, 21.172365188598633, 27.952306747436523]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 12.0, 12.0, 12.0, 13.0, 16.0, 29.0, 17.0, 27.0, 26.0, 27.0, 34.0, 43.0, 50.0, 39.0, 37.0, 47.0, 47.0, 47.0, 45.0, 40.0, 37.0, 43.0, 32.0, 40.0, 38.0, 22.0, 27.0, 25.0, 19.0, 16.0, 15.0, 15.0, 9.0, 5.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.35944366455078, -23.451749801635742, -22.544055938720703, -21.63636016845703, -20.728666305541992, -19.820972442626953, -18.913278579711914, -18.005584716796875, -17.097890853881836, -16.190196990966797, -15.282502174377441, -14.374808311462402, -13.467114448547363, -12.559419631958008, -11.651725769042969, -10.74403190612793, -9.836337089538574, -8.928643226623535, -8.02094841003418, -7.113254547119141, -6.205560684204102, -5.297866344451904, -4.390172004699707, -3.482478141784668, -2.5747838020324707, -1.6670897006988525, -0.7593954801559448, 0.1482987403869629, 1.055992841720581, 1.9636869430541992, 2.8713812828063965, 3.7790751457214355, 4.686769485473633, 5.59446382522583, 6.502157688140869, 7.409852027893066, 8.317545890808105, 9.225240707397461, 10.1329345703125, 11.040628433227539, 11.948322296142578, 12.856016159057617, 13.763710975646973, 14.671404838562012, 15.57909870147705, 16.486793518066406, 17.394487380981445, 18.302181243896484, 19.209877014160156, 20.117570877075195, 21.025264739990234, 21.932960510253906, 22.840654373168945, 23.748348236083984, 24.656042098999023, 25.563735961914062, 26.4714298248291, 27.37912368774414, 28.28681755065918, 29.19451141357422, 30.10220718383789, 31.00990104675293, 31.91759490966797, 32.825286865234375, 33.73298263549805]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 9.0, 14.0, 5.0, 7.0, 8.0, 14.0, 18.0, 23.0, 21.0, 24.0, 20.0, 24.0, 33.0, 28.0, 33.0, 29.0, 38.0, 37.0, 37.0, 48.0, 47.0, 40.0, 48.0, 43.0, 35.0, 35.0, 36.0, 26.0, 26.0, 26.0, 23.0, 32.0, 8.0, 24.0, 17.0, 12.0, 6.0, 12.0, 8.0, 3.0, 7.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.748046875, -3.620086669921875, -3.49212646484375, -3.364166259765625, -3.2362060546875, -3.108245849609375, -2.98028564453125, -2.852325439453125, -2.724365234375, -2.596405029296875, -2.46844482421875, -2.340484619140625, -2.2125244140625, -2.084564208984375, -1.95660400390625, -1.828643798828125, -1.70068359375, -1.572723388671875, -1.44476318359375, -1.316802978515625, -1.1888427734375, -1.060882568359375, -0.93292236328125, -0.804962158203125, -0.677001953125, -0.549041748046875, -0.42108154296875, -0.293121337890625, -0.1651611328125, -0.037200927734375, 0.09075927734375, 0.218719482421875, 0.3466796875, 0.474639892578125, 0.60260009765625, 0.730560302734375, 0.8585205078125, 0.986480712890625, 1.11444091796875, 1.242401123046875, 1.370361328125, 1.498321533203125, 1.62628173828125, 1.754241943359375, 1.8822021484375, 2.010162353515625, 2.13812255859375, 2.266082763671875, 2.39404296875, 2.522003173828125, 2.64996337890625, 2.777923583984375, 2.9058837890625, 3.033843994140625, 3.16180419921875, 3.289764404296875, 3.417724609375, 3.545684814453125, 3.67364501953125, 3.801605224609375, 3.9295654296875, 4.057525634765625, 4.18548583984375, 4.313446044921875, 4.44140625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 8.0, 5.0, 6.0, 5.0, 8.0, 8.0, 9.0, 9.0, 19.0, 25.0, 36.0, 23.0, 40.0, 69.0, 80.0, 129.0, 206.0, 360.0, 563.0, 1405.0, 4516.0, 20905.0, 122263.0, 625253.0, 1673659.0, 1301606.0, 363675.0, 63353.0, 10911.0, 2817.0, 1002.0, 481.0, 229.0, 171.0, 89.0, 73.0, 64.0, 49.0, 28.0, 29.0, 24.0, 15.0, 8.0, 17.0, 5.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44140625, -4.28173828125, -4.1220703125, -3.96240234375, -3.802734375, -3.64306640625, -3.4833984375, -3.32373046875, -3.1640625, -3.00439453125, -2.8447265625, -2.68505859375, -2.525390625, -2.36572265625, -2.2060546875, -2.04638671875, -1.88671875, -1.72705078125, -1.5673828125, -1.40771484375, -1.248046875, -1.08837890625, -0.9287109375, -0.76904296875, -0.609375, -0.44970703125, -0.2900390625, -0.13037109375, 0.029296875, 0.18896484375, 0.3486328125, 0.50830078125, 0.66796875, 0.82763671875, 0.9873046875, 1.14697265625, 1.306640625, 1.46630859375, 1.6259765625, 1.78564453125, 1.9453125, 2.10498046875, 2.2646484375, 2.42431640625, 2.583984375, 2.74365234375, 2.9033203125, 3.06298828125, 3.22265625, 3.38232421875, 3.5419921875, 3.70166015625, 3.861328125, 4.02099609375, 4.1806640625, 4.34033203125, 4.5, 4.65966796875, 4.8193359375, 4.97900390625, 5.138671875, 5.29833984375, 5.4580078125, 5.61767578125, 5.77734375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 9.0, 14.0, 10.0, 21.0, 27.0, 30.0, 43.0, 54.0, 77.0, 129.0, 170.0, 241.0, 324.0, 429.0, 461.0, 450.0, 391.0, 311.0, 245.0, 171.0, 116.0, 75.0, 55.0, 47.0, 46.0, 29.0, 19.0, 18.0, 12.0, 8.0, 7.0, 6.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.1953125, -5.0218505859375, -4.848388671875, -4.6749267578125, -4.50146484375, -4.3280029296875, -4.154541015625, -3.9810791015625, -3.8076171875, -3.6341552734375, -3.460693359375, -3.2872314453125, -3.11376953125, -2.9403076171875, -2.766845703125, -2.5933837890625, -2.419921875, -2.2464599609375, -2.072998046875, -1.8995361328125, -1.72607421875, -1.5526123046875, -1.379150390625, -1.2056884765625, -1.0322265625, -0.8587646484375, -0.685302734375, -0.5118408203125, -0.33837890625, -0.1649169921875, 0.008544921875, 0.1820068359375, 0.35546875, 0.5289306640625, 0.702392578125, 0.8758544921875, 1.04931640625, 1.2227783203125, 1.396240234375, 1.5697021484375, 1.7431640625, 1.9166259765625, 2.090087890625, 2.2635498046875, 2.43701171875, 2.6104736328125, 2.783935546875, 2.9573974609375, 3.130859375, 3.3043212890625, 3.477783203125, 3.6512451171875, 3.82470703125, 3.9981689453125, 4.171630859375, 4.3450927734375, 4.5185546875, 4.6920166015625, 4.865478515625, 5.0389404296875, 5.21240234375, 5.3858642578125, 5.559326171875, 5.7327880859375, 5.90625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 10.0, 4.0, 7.0, 15.0, 14.0, 16.0, 27.0, 47.0, 43.0, 61.0, 93.0, 153.0, 229.0, 431.0, 889.0, 2595.0, 11772.0, 82810.0, 1055865.0, 2727464.0, 273268.0, 29895.0, 5487.0, 1616.0, 612.0, 293.0, 190.0, 125.0, 63.0, 47.0, 36.0, 37.0, 16.0, 11.0, 18.0, 5.0, 7.0, 5.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.40625, -7.1129150390625, -6.819580078125, -6.5262451171875, -6.23291015625, -5.9395751953125, -5.646240234375, -5.3529052734375, -5.0595703125, -4.7662353515625, -4.472900390625, -4.1795654296875, -3.88623046875, -3.5928955078125, -3.299560546875, -3.0062255859375, -2.712890625, -2.4195556640625, -2.126220703125, -1.8328857421875, -1.53955078125, -1.2462158203125, -0.952880859375, -0.6595458984375, -0.3662109375, -0.0728759765625, 0.220458984375, 0.5137939453125, 0.80712890625, 1.1004638671875, 1.393798828125, 1.6871337890625, 1.98046875, 2.2738037109375, 2.567138671875, 2.8604736328125, 3.15380859375, 3.4471435546875, 3.740478515625, 4.0338134765625, 4.3271484375, 4.6204833984375, 4.913818359375, 5.2071533203125, 5.50048828125, 5.7938232421875, 6.087158203125, 6.3804931640625, 6.673828125, 6.9671630859375, 7.260498046875, 7.5538330078125, 7.84716796875, 8.1405029296875, 8.433837890625, 8.7271728515625, 9.0205078125, 9.3138427734375, 9.607177734375, 9.9005126953125, 10.19384765625, 10.4871826171875, 10.780517578125, 11.0738525390625, 11.3671875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 89.0, 265.0, 371.0, 221.0, 41.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.562997817993164, -20.562423706054688, -18.56184959411621, -16.561275482177734, -14.560702323913574, -12.560128211975098, -10.559555053710938, -8.558980941772461, -6.558406829833984, -4.557832717895508, -2.5572590827941895, -0.5566854476928711, 1.4438886642456055, 3.444462776184082, 5.445035934448242, 7.445610046386719, 9.446184158325195, 11.446758270263672, 13.447332382202148, 15.447905540466309, 17.44847869873047, 19.449054718017578, 21.449626922607422, 23.4502010345459, 25.450775146484375, 27.45134925842285, 29.451923370361328, 31.452495574951172, 33.45307159423828, 35.453643798828125, 37.45421600341797, 39.45479202270508, 41.45536804199219, 43.45594024658203, 45.45651626586914, 47.457088470458984, 49.457664489746094, 51.45823669433594, 53.45880889892578, 55.45938491821289, 57.4599609375, 59.460533142089844, 61.46110916137695, 63.4616813659668, 65.4622573852539, 67.46282958984375, 69.4634017944336, 71.46397399902344, 73.46455383300781, 75.46512603759766, 77.4656982421875, 79.46627807617188, 81.46685028076172, 83.46742248535156, 85.4679946899414, 87.46856689453125, 89.4691390991211, 91.46971130371094, 93.47028350830078, 95.47086334228516, 97.471435546875, 99.47200775146484, 101.47257995605469, 103.47315979003906, 105.4737319946289]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 6.0, 10.0, 16.0, 9.0, 18.0, 13.0, 24.0, 21.0, 24.0, 34.0, 35.0, 32.0, 29.0, 40.0, 41.0, 41.0, 38.0, 47.0, 33.0, 40.0, 29.0, 42.0, 40.0, 49.0, 32.0, 22.0, 35.0, 29.0, 26.0, 19.0, 20.0, 20.0, 15.0, 8.0, 7.0, 10.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.538654327392578, -19.92561149597168, -19.31256866455078, -18.699525833129883, -18.086483001708984, -17.473440170288086, -16.860397338867188, -16.24735450744629, -15.63431167602539, -15.021268844604492, -14.408226013183594, -13.795183181762695, -13.182140350341797, -12.569097518920898, -11.9560546875, -11.343011856079102, -10.729969024658203, -10.116926193237305, -9.503883361816406, -8.890840530395508, -8.27779769897461, -7.664754867553711, -7.0517120361328125, -6.438669204711914, -5.825626373291016, -5.212583541870117, -4.599540710449219, -3.9864978790283203, -3.373455047607422, -2.7604122161865234, -2.147369384765625, -1.5343265533447266, -0.9212818145751953, -0.3082389831542969, 0.30480384826660156, 0.9178466796875, 1.5308895111083984, 2.143932342529297, 2.7569751739501953, 3.3700180053710938, 3.983060836791992, 4.596103668212891, 5.209146499633789, 5.8221893310546875, 6.435232162475586, 7.048274993896484, 7.661317825317383, 8.274360656738281, 8.88740348815918, 9.500446319580078, 10.113489151000977, 10.726531982421875, 11.339574813842773, 11.952617645263672, 12.56566047668457, 13.178703308105469, 13.791746139526367, 14.404788970947266, 15.017831802368164, 15.630874633789062, 16.24391746520996, 16.85696029663086, 17.470003128051758, 18.083045959472656, 18.696088790893555]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 10.0, 6.0, 12.0, 9.0, 15.0, 16.0, 17.0, 17.0, 33.0, 21.0, 28.0, 27.0, 33.0, 33.0, 30.0, 41.0, 43.0, 32.0, 51.0, 44.0, 36.0, 37.0, 33.0, 42.0, 36.0, 36.0, 31.0, 28.0, 29.0, 27.0, 19.0, 20.0, 19.0, 10.0, 13.0, 8.0, 14.0, 10.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74310302734375, -3.6190185546875, -3.49493408203125, -3.370849609375, -3.24676513671875, -3.1226806640625, -2.99859619140625, -2.87451171875, -2.75042724609375, -2.6263427734375, -2.50225830078125, -2.378173828125, -2.25408935546875, -2.1300048828125, -2.00592041015625, -1.8818359375, -1.75775146484375, -1.6336669921875, -1.50958251953125, -1.385498046875, -1.26141357421875, -1.1373291015625, -1.01324462890625, -0.88916015625, -0.76507568359375, -0.6409912109375, -0.51690673828125, -0.392822265625, -0.26873779296875, -0.1446533203125, -0.02056884765625, 0.103515625, 0.22760009765625, 0.3516845703125, 0.47576904296875, 0.599853515625, 0.72393798828125, 0.8480224609375, 0.97210693359375, 1.09619140625, 1.22027587890625, 1.3443603515625, 1.46844482421875, 1.592529296875, 1.71661376953125, 1.8406982421875, 1.96478271484375, 2.0888671875, 2.21295166015625, 2.3370361328125, 2.46112060546875, 2.585205078125, 2.70928955078125, 2.8333740234375, 2.95745849609375, 3.08154296875, 3.20562744140625, 3.3297119140625, 3.45379638671875, 3.577880859375, 3.70196533203125, 3.8260498046875, 3.95013427734375, 4.07421875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 8.0, 5.0, 16.0, 27.0, 21.0, 41.0, 60.0, 98.0, 134.0, 196.0, 292.0, 438.0, 632.0, 910.0, 1434.0, 2152.0, 3368.0, 4951.0, 7604.0, 11870.0, 18129.0, 29093.0, 46800.0, 79641.0, 145977.0, 277181.0, 177911.0, 93070.0, 54157.0, 33106.0, 20708.0, 13486.0, 8556.0, 5490.0, 3783.0, 2454.0, 1504.0, 1018.0, 710.0, 517.0, 305.0, 223.0, 169.0, 90.0, 69.0, 45.0, 43.0, 21.0, 17.0, 6.0, 11.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.734375, -0.7118759155273438, -0.6893768310546875, -0.6668777465820312, -0.644378662109375, -0.6218795776367188, -0.5993804931640625, -0.5768814086914062, -0.55438232421875, -0.5318832397460938, -0.5093841552734375, -0.48688507080078125, -0.464385986328125, -0.44188690185546875, -0.4193878173828125, -0.39688873291015625, -0.3743896484375, -0.35189056396484375, -0.3293914794921875, -0.30689239501953125, -0.284393310546875, -0.26189422607421875, -0.2393951416015625, -0.21689605712890625, -0.19439697265625, -0.17189788818359375, -0.1493988037109375, -0.12689971923828125, -0.104400634765625, -0.08190155029296875, -0.0594024658203125, -0.03690338134765625, -0.014404296875, 0.00809478759765625, 0.0305938720703125, 0.05309295654296875, 0.075592041015625, 0.09809112548828125, 0.1205902099609375, 0.14308929443359375, 0.16558837890625, 0.18808746337890625, 0.2105865478515625, 0.23308563232421875, 0.255584716796875, 0.27808380126953125, 0.3005828857421875, 0.32308197021484375, 0.3455810546875, 0.36808013916015625, 0.3905792236328125, 0.41307830810546875, 0.435577392578125, 0.45807647705078125, 0.4805755615234375, 0.5030746459960938, 0.52557373046875, 0.5480728149414062, 0.5705718994140625, 0.5930709838867188, 0.615570068359375, 0.6380691528320312, 0.6605682373046875, 0.6830673217773438, 0.70556640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 9.0, 5.0, 12.0, 15.0, 9.0, 15.0, 23.0, 35.0, 23.0, 28.0, 41.0, 41.0, 35.0, 38.0, 35.0, 31.0, 49.0, 36.0, 1071.0, 40.0, 40.0, 36.0, 35.0, 41.0, 28.0, 24.0, 37.0, 26.0, 32.0, 20.0, 14.0, 21.0, 16.0, 8.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.83203125, -2.747344970703125, -2.66265869140625, -2.577972412109375, -2.4932861328125, -2.408599853515625, -2.32391357421875, -2.239227294921875, -2.154541015625, -2.069854736328125, -1.98516845703125, -1.900482177734375, -1.8157958984375, -1.731109619140625, -1.64642333984375, -1.561737060546875, -1.47705078125, -1.392364501953125, -1.30767822265625, -1.222991943359375, -1.1383056640625, -1.053619384765625, -0.96893310546875, -0.884246826171875, -0.799560546875, -0.714874267578125, -0.63018798828125, -0.545501708984375, -0.4608154296875, -0.376129150390625, -0.29144287109375, -0.206756591796875, -0.1220703125, -0.037384033203125, 0.04730224609375, 0.131988525390625, 0.2166748046875, 0.301361083984375, 0.38604736328125, 0.470733642578125, 0.555419921875, 0.640106201171875, 0.72479248046875, 0.809478759765625, 0.8941650390625, 0.978851318359375, 1.06353759765625, 1.148223876953125, 1.23291015625, 1.317596435546875, 1.40228271484375, 1.486968994140625, 1.5716552734375, 1.656341552734375, 1.74102783203125, 1.825714111328125, 1.910400390625, 1.995086669921875, 2.07977294921875, 2.164459228515625, 2.2491455078125, 2.333831787109375, 2.41851806640625, 2.503204345703125, 2.587890625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 13.0, 19.0, 28.0, 39.0, 61.0, 93.0, 155.0, 211.0, 334.0, 491.0, 703.0, 1066.0, 1593.0, 2403.0, 3568.0, 5539.0, 8612.0, 13501.0, 21433.0, 34299.0, 58389.0, 104573.0, 218118.0, 1319128.0, 124744.0, 68872.0, 40489.0, 24676.0, 15432.0, 9776.0, 6370.0, 4159.0, 2762.0, 1890.0, 1277.0, 814.0, 529.0, 345.0, 218.0, 149.0, 99.0, 56.0, 28.0, 33.0, 18.0, 5.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7358932495117188, -0.7129974365234375, -0.6901016235351562, -0.667205810546875, -0.6443099975585938, -0.6214141845703125, -0.5985183715820312, -0.57562255859375, -0.5527267456054688, -0.5298309326171875, -0.5069351196289062, -0.484039306640625, -0.46114349365234375, -0.4382476806640625, -0.41535186767578125, -0.3924560546875, -0.36956024169921875, -0.3466644287109375, -0.32376861572265625, -0.300872802734375, -0.27797698974609375, -0.2550811767578125, -0.23218536376953125, -0.20928955078125, -0.18639373779296875, -0.1634979248046875, -0.14060211181640625, -0.117706298828125, -0.09481048583984375, -0.0719146728515625, -0.04901885986328125, -0.026123046875, -0.00322723388671875, 0.0196685791015625, 0.04256439208984375, 0.065460205078125, 0.08835601806640625, 0.1112518310546875, 0.13414764404296875, 0.15704345703125, 0.17993927001953125, 0.2028350830078125, 0.22573089599609375, 0.248626708984375, 0.27152252197265625, 0.2944183349609375, 0.31731414794921875, 0.3402099609375, 0.36310577392578125, 0.3860015869140625, 0.40889739990234375, 0.431793212890625, 0.45468902587890625, 0.4775848388671875, 0.5004806518554688, 0.52337646484375, 0.5462722778320312, 0.5691680908203125, 0.5920639038085938, 0.614959716796875, 0.6378555297851562, 0.6607513427734375, 0.6836471557617188, 0.70654296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 5.0, 10.0, 14.0, 11.0, 13.0, 17.0, 19.0, 32.0, 32.0, 41.0, 56.0, 57.0, 63.0, 65.0, 78.0, 84.0, 71.0, 53.0, 33.0, 46.0, 41.0, 36.0, 22.0, 18.0, 15.0, 12.0, 8.0, 3.0, 15.0, 4.0, 5.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004181861877441406, -0.000403478741645813, -0.00038877129554748535, -0.0003740638494491577, -0.0003593564033508301, -0.00034464895725250244, -0.0003299415111541748, -0.00031523406505584717, -0.00030052661895751953, -0.0002858191728591919, -0.00027111172676086426, -0.0002564042806625366, -0.00024169683456420898, -0.00022698938846588135, -0.0002122819423675537, -0.00019757449626922607, -0.00018286705017089844, -0.0001681596040725708, -0.00015345215797424316, -0.00013874471187591553, -0.0001240372657775879, -0.00010932981967926025, -9.462237358093262e-05, -7.991492748260498e-05, -6.520748138427734e-05, -5.050003528594971e-05, -3.579258918762207e-05, -2.1085143089294434e-05, -6.377696990966797e-06, 8.32974910736084e-06, 2.3037195205688477e-05, 3.774464130401611e-05, 5.245208740234375e-05, 6.715953350067139e-05, 8.186697959899902e-05, 9.657442569732666e-05, 0.0001112818717956543, 0.00012598931789398193, 0.00014069676399230957, 0.0001554042100906372, 0.00017011165618896484, 0.00018481910228729248, 0.00019952654838562012, 0.00021423399448394775, 0.0002289414405822754, 0.00024364888668060303, 0.00025835633277893066, 0.0002730637788772583, 0.00028777122497558594, 0.0003024786710739136, 0.0003171861171722412, 0.00033189356327056885, 0.0003466010093688965, 0.0003613084554672241, 0.00037601590156555176, 0.0003907233476638794, 0.00040543079376220703, 0.00042013823986053467, 0.0004348456859588623, 0.00044955313205718994, 0.0004642605781555176, 0.0004789680242538452, 0.0004936754703521729, 0.0005083829164505005, 0.0005230903625488281]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 3.0, 4.0, 5.0, 6.0, 13.0, 17.0, 20.0, 21.0, 21.0, 38.0, 41.0, 66.0, 94.0, 135.0, 198.0, 283.0, 555.0, 1271.0, 362612.0, 680038.0, 1544.0, 603.0, 303.0, 187.0, 130.0, 80.0, 67.0, 31.0, 35.0, 28.0, 26.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.01032257080078125, -0.010043919086456299, -0.009765267372131348, -0.009486615657806396, -0.009207963943481445, -0.008929312229156494, -0.008650660514831543, -0.008372008800506592, -0.00809335708618164, -0.00781470537185669, -0.007536053657531738, -0.007257401943206787, -0.006978750228881836, -0.006700098514556885, -0.006421446800231934, -0.006142795085906982, -0.005864143371582031, -0.00558549165725708, -0.005306839942932129, -0.005028188228607178, -0.0047495365142822266, -0.004470884799957275, -0.004192233085632324, -0.003913581371307373, -0.003634929656982422, -0.0033562779426574707, -0.0030776262283325195, -0.0027989745140075684, -0.002520322799682617, -0.002241671085357666, -0.001963019371032715, -0.0016843676567077637, -0.0014057159423828125, -0.0011270642280578613, -0.0008484125137329102, -0.000569760799407959, -0.0002911090850830078, -1.245737075805664e-05, 0.00026619434356689453, 0.0005448460578918457, 0.0008234977722167969, 0.001102149486541748, 0.0013808012008666992, 0.0016594529151916504, 0.0019381046295166016, 0.0022167563438415527, 0.002495408058166504, 0.002774059772491455, 0.0030527114868164062, 0.0033313632011413574, 0.0036100149154663086, 0.0038886666297912598, 0.004167318344116211, 0.004445970058441162, 0.004724621772766113, 0.0050032734870910645, 0.005281925201416016, 0.005560576915740967, 0.005839228630065918, 0.006117880344390869, 0.00639653205871582, 0.0066751837730407715, 0.006953835487365723, 0.007232487201690674, 0.007511138916015625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 14.0, 49.0, 103.0, 199.0, 230.0, 177.0, 139.0, 57.0, 20.0, 15.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006207413389347494, -0.0006061834865249693, -0.0005916256923228502, -0.0005770678399130702, -0.0005625099875032902, -0.0005479521350935102, -0.0005333942826837301, -0.000518836488481611, -0.000504278636071831, -0.000489720783662051, -0.0004751629603561014, -0.0004606051370501518, -0.0004460472846403718, -0.0004314894322305918, -0.0004169316089246422, -0.00040237378561869264, -0.0003878159332089126, -0.0003732580807991326, -0.000358700257493183, -0.00034414243418723345, -0.0003295845817774534, -0.0003150267293676734, -0.00030046890606172383, -0.00028591108275577426, -0.00027135323034599423, -0.0002567953779362142, -0.00024223755463026464, -0.00022767971677239984, -0.00021312187891453505, -0.00019856404105667025, -0.00018400620319880545, -0.00016944836534094065, -0.00015489052748307586, -0.00014033268962521106, -0.00012577485176734626, -0.00011121701390948147, -9.665917605161667e-05, -8.210133819375187e-05, -6.754350033588707e-05, -5.298566247802228e-05, -3.842782462015748e-05, -2.3869986762292683e-05, -9.312148904427886e-06, 5.245688953436911e-06, 1.9803526811301708e-05, 3.4361364669166505e-05, 4.89192025270313e-05, 6.34770403848961e-05, 7.80348782427609e-05, 9.25927161006257e-05, 0.00010715055395849049, 0.00012170839181635529, 0.00013626622967422009, 0.00015082406753208488, 0.00016538190538994968, 0.00017993974324781448, 0.00019449758110567927, 0.00020905541896354407, 0.00022361325682140887, 0.00023817109467927366, 0.00025272893253713846, 0.0002672867849469185, 0.00028184460825286806, 0.0002964024315588176, 0.00031096028396859765]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 6.0, 7.0, 9.0, 3.0, 6.0, 11.0, 10.0, 13.0, 10.0, 17.0, 15.0, 17.0, 30.0, 32.0, 35.0, 35.0, 32.0, 24.0, 38.0, 49.0, 45.0, 29.0, 35.0, 36.0, 32.0, 35.0, 34.0, 41.0, 35.0, 30.0, 33.0, 29.0, 34.0, 21.0, 20.0, 29.0, 18.0, 13.0, 19.0, 6.0, 8.0, 3.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019699335098266602, -0.0001905057579278946, -0.00018401816487312317, -0.00017753057181835175, -0.00017104297876358032, -0.0001645553857088089, -0.00015806779265403748, -0.00015158019959926605, -0.00014509260654449463, -0.0001386050134897232, -0.00013211742043495178, -0.00012562982738018036, -0.00011914223432540894, -0.00011265464127063751, -0.00010616704821586609, -9.967945516109467e-05, -9.319186210632324e-05, -8.670426905155182e-05, -8.02166759967804e-05, -7.372908294200897e-05, -6.724148988723755e-05, -6.0753896832466125e-05, -5.42663037776947e-05, -4.777871072292328e-05, -4.1291117668151855e-05, -3.480352461338043e-05, -2.831593155860901e-05, -2.1828338503837585e-05, -1.5340745449066162e-05, -8.853152394294739e-06, -2.3655593395233154e-06, 4.122033715248108e-06, 1.0609626770019531e-05, 1.7097219824790955e-05, 2.3584812879562378e-05, 3.00724059343338e-05, 3.6559998989105225e-05, 4.304759204387665e-05, 4.953518509864807e-05, 5.6022778153419495e-05, 6.251037120819092e-05, 6.899796426296234e-05, 7.548555731773376e-05, 8.197315037250519e-05, 8.846074342727661e-05, 9.494833648204803e-05, 0.00010143592953681946, 0.00010792352259159088, 0.0001144111156463623, 0.00012089870870113373, 0.00012738630175590515, 0.00013387389481067657, 0.000140361487865448, 0.00014684908092021942, 0.00015333667397499084, 0.00015982426702976227, 0.0001663118600845337, 0.00017279945313930511, 0.00017928704619407654, 0.00018577463924884796, 0.00019226223230361938, 0.0001987498253583908, 0.00020523741841316223, 0.00021172501146793365, 0.00021821260452270508]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 10.0, 6.0, 12.0, 9.0, 15.0, 16.0, 17.0, 17.0, 33.0, 21.0, 28.0, 27.0, 33.0, 33.0, 30.0, 41.0, 43.0, 32.0, 51.0, 44.0, 36.0, 37.0, 33.0, 42.0, 36.0, 36.0, 31.0, 28.0, 29.0, 27.0, 19.0, 20.0, 19.0, 10.0, 13.0, 8.0, 14.0, 10.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74310302734375, -3.6190185546875, -3.49493408203125, -3.370849609375, -3.24676513671875, -3.1226806640625, -2.99859619140625, -2.87451171875, -2.75042724609375, -2.6263427734375, -2.50225830078125, -2.378173828125, -2.25408935546875, -2.1300048828125, -2.00592041015625, -1.8818359375, -1.75775146484375, -1.6336669921875, -1.50958251953125, -1.385498046875, -1.26141357421875, -1.1373291015625, -1.01324462890625, -0.88916015625, -0.76507568359375, -0.6409912109375, -0.51690673828125, -0.392822265625, -0.26873779296875, -0.1446533203125, -0.02056884765625, 0.103515625, 0.22760009765625, 0.3516845703125, 0.47576904296875, 0.599853515625, 0.72393798828125, 0.8480224609375, 0.97210693359375, 1.09619140625, 1.22027587890625, 1.3443603515625, 1.46844482421875, 1.592529296875, 1.71661376953125, 1.8406982421875, 1.96478271484375, 2.0888671875, 2.21295166015625, 2.3370361328125, 2.46112060546875, 2.585205078125, 2.70928955078125, 2.8333740234375, 2.95745849609375, 3.08154296875, 3.20562744140625, 3.3297119140625, 3.45379638671875, 3.577880859375, 3.70196533203125, 3.8260498046875, 3.95013427734375, 4.07421875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 6.0, 9.0, 15.0, 22.0, 30.0, 39.0, 57.0, 61.0, 64.0, 97.0, 124.0, 192.0, 253.0, 346.0, 500.0, 767.0, 1344.0, 2880.0, 6768.0, 20609.0, 68648.0, 207210.0, 379909.0, 237712.0, 81141.0, 24673.0, 7712.0, 3034.0, 1558.0, 868.0, 510.0, 351.0, 267.0, 177.0, 140.0, 102.0, 107.0, 65.0, 39.0, 41.0, 23.0, 18.0, 19.0, 18.0, 6.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.0390625, -4.87945556640625, -4.7198486328125, -4.56024169921875, -4.400634765625, -4.24102783203125, -4.0814208984375, -3.92181396484375, -3.76220703125, -3.60260009765625, -3.4429931640625, -3.28338623046875, -3.123779296875, -2.96417236328125, -2.8045654296875, -2.64495849609375, -2.4853515625, -2.32574462890625, -2.1661376953125, -2.00653076171875, -1.846923828125, -1.68731689453125, -1.5277099609375, -1.36810302734375, -1.20849609375, -1.04888916015625, -0.8892822265625, -0.72967529296875, -0.570068359375, -0.41046142578125, -0.2508544921875, -0.09124755859375, 0.068359375, 0.22796630859375, 0.3875732421875, 0.54718017578125, 0.706787109375, 0.86639404296875, 1.0260009765625, 1.18560791015625, 1.34521484375, 1.50482177734375, 1.6644287109375, 1.82403564453125, 1.983642578125, 2.14324951171875, 2.3028564453125, 2.46246337890625, 2.6220703125, 2.78167724609375, 2.9412841796875, 3.10089111328125, 3.260498046875, 3.42010498046875, 3.5797119140625, 3.73931884765625, 3.89892578125, 4.05853271484375, 4.2181396484375, 4.37774658203125, 4.537353515625, 4.69696044921875, 4.8565673828125, 5.01617431640625, 5.17578125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 7.0, 16.0, 14.0, 16.0, 23.0, 27.0, 27.0, 30.0, 33.0, 41.0, 52.0, 54.0, 77.0, 162.0, 323.0, 1413.0, 185.0, 87.0, 73.0, 57.0, 48.0, 39.0, 44.0, 38.0, 22.0, 27.0, 22.0, 14.0, 13.0, 5.0, 8.0, 4.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.8125, -11.4320068359375, -11.051513671875, -10.6710205078125, -10.29052734375, -9.9100341796875, -9.529541015625, -9.1490478515625, -8.7685546875, -8.3880615234375, -8.007568359375, -7.6270751953125, -7.24658203125, -6.8660888671875, -6.485595703125, -6.1051025390625, -5.724609375, -5.3441162109375, -4.963623046875, -4.5831298828125, -4.20263671875, -3.8221435546875, -3.441650390625, -3.0611572265625, -2.6806640625, -2.3001708984375, -1.919677734375, -1.5391845703125, -1.15869140625, -0.7781982421875, -0.397705078125, -0.0172119140625, 0.36328125, 0.7437744140625, 1.124267578125, 1.5047607421875, 1.88525390625, 2.2657470703125, 2.646240234375, 3.0267333984375, 3.4072265625, 3.7877197265625, 4.168212890625, 4.5487060546875, 4.92919921875, 5.3096923828125, 5.690185546875, 6.0706787109375, 6.451171875, 6.8316650390625, 7.212158203125, 7.5926513671875, 7.97314453125, 8.3536376953125, 8.734130859375, 9.1146240234375, 9.4951171875, 9.8756103515625, 10.256103515625, 10.6365966796875, 11.01708984375, 11.3975830078125, 11.778076171875, 12.1585693359375, 12.5390625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 3.0, 15.0, 12.0, 17.0, 30.0, 40.0, 49.0, 71.0, 86.0, 132.0, 249.0, 356.0, 612.0, 1252.0, 6442.0, 2666720.0, 463996.0, 3304.0, 896.0, 480.0, 305.0, 208.0, 135.0, 85.0, 55.0, 42.0, 33.0, 15.0, 25.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.953125, -30.09033203125, -29.2275390625, -28.36474609375, -27.501953125, -26.63916015625, -25.7763671875, -24.91357421875, -24.05078125, -23.18798828125, -22.3251953125, -21.46240234375, -20.599609375, -19.73681640625, -18.8740234375, -18.01123046875, -17.1484375, -16.28564453125, -15.4228515625, -14.56005859375, -13.697265625, -12.83447265625, -11.9716796875, -11.10888671875, -10.24609375, -9.38330078125, -8.5205078125, -7.65771484375, -6.794921875, -5.93212890625, -5.0693359375, -4.20654296875, -3.34375, -2.48095703125, -1.6181640625, -0.75537109375, 0.107421875, 0.97021484375, 1.8330078125, 2.69580078125, 3.55859375, 4.42138671875, 5.2841796875, 6.14697265625, 7.009765625, 7.87255859375, 8.7353515625, 9.59814453125, 10.4609375, 11.32373046875, 12.1865234375, 13.04931640625, 13.912109375, 14.77490234375, 15.6376953125, 16.50048828125, 17.36328125, 18.22607421875, 19.0888671875, 19.95166015625, 20.814453125, 21.67724609375, 22.5400390625, 23.40283203125, 24.265625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 91.0, 584.0, 316.0, 17.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.23248291015625, -66.64657592773438, -64.0606689453125, -61.474761962890625, -58.888858795166016, -56.30295181274414, -53.717044830322266, -51.131141662597656, -48.54523468017578, -45.959327697753906, -43.37342071533203, -40.787513732910156, -38.20161056518555, -35.61570358276367, -33.0297966003418, -30.443891525268555, -27.857982635498047, -25.272075653076172, -22.68617057800293, -20.100263595581055, -17.514358520507812, -14.928451538085938, -12.342544555664062, -9.75663948059082, -7.170732498168945, -4.584826469421387, -1.99891996383667, 0.5869865417480469, 3.1728925704956055, 5.758798599243164, 8.344705581665039, 10.930610656738281, 13.516517639160156, 16.10242462158203, 18.688329696655273, 21.27423667907715, 23.86014175415039, 26.446048736572266, 29.03195571899414, 31.617860794067383, 34.203765869140625, 36.7896728515625, 39.375579833984375, 41.96148681640625, 44.54738998413086, 47.133296966552734, 49.71920394897461, 52.30510711669922, 54.89101791381836, 57.476924896240234, 60.06283187866211, 62.64873504638672, 65.2346420288086, 67.82054901123047, 70.40645599365234, 72.99236297607422, 75.5782699584961, 78.16417694091797, 80.75008392333984, 83.33599090576172, 85.9218978881836, 88.50779724121094, 91.09370422363281, 93.67961120605469, 96.26551818847656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 9.0, 7.0, 11.0, 16.0, 25.0, 24.0, 25.0, 22.0, 30.0, 31.0, 36.0, 43.0, 41.0, 43.0, 45.0, 49.0, 59.0, 38.0, 54.0, 54.0, 42.0, 35.0, 35.0, 25.0, 23.0, 38.0, 27.0, 21.0, 14.0, 18.0, 12.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.111183166503906, -21.219919204711914, -20.328655242919922, -19.437393188476562, -18.54612922668457, -17.654865264892578, -16.76360321044922, -15.872339248657227, -14.981075286865234, -14.089811325073242, -13.198548316955566, -12.30728530883789, -11.416021347045898, -10.524757385253906, -9.63349437713623, -8.742231369018555, -7.8509674072265625, -6.9597039222717285, -6.0684404373168945, -5.1771769523620605, -4.285913467407227, -3.3946499824523926, -2.5033864974975586, -1.6121230125427246, -0.7208595275878906, 0.17040395736694336, 1.0616674423217773, 1.9529309272766113, 2.8441944122314453, 3.7354578971862793, 4.626721382141113, 5.517984867095947, 6.409248352050781, 7.300511837005615, 8.19177532196045, 9.083038330078125, 9.974302291870117, 10.86556625366211, 11.756829261779785, 12.648092269897461, 13.539356231689453, 14.430620193481445, 15.321883201599121, 16.213146209716797, 17.10441017150879, 17.99567413330078, 18.88693618774414, 19.778200149536133, 20.669464111328125, 21.560728073120117, 22.45199203491211, 23.34325408935547, 24.23451805114746, 25.125782012939453, 26.017044067382812, 26.908308029174805, 27.799571990966797, 28.69083595275879, 29.58209991455078, 30.47336196899414, 31.364625930786133, 32.255889892578125, 33.147151947021484, 34.03841781616211, 34.92967987060547]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 11.0, 15.0, 16.0, 17.0, 21.0, 22.0, 29.0, 27.0, 30.0, 29.0, 39.0, 32.0, 36.0, 36.0, 45.0, 52.0, 41.0, 52.0, 31.0, 35.0, 47.0, 39.0, 25.0, 26.0, 26.0, 35.0, 22.0, 23.0, 25.0, 18.0, 13.0, 5.0, 14.0, 6.0, 13.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.935546875, -3.810150146484375, -3.68475341796875, -3.559356689453125, -3.4339599609375, -3.308563232421875, -3.18316650390625, -3.057769775390625, -2.932373046875, -2.806976318359375, -2.68157958984375, -2.556182861328125, -2.4307861328125, -2.305389404296875, -2.17999267578125, -2.054595947265625, -1.92919921875, -1.803802490234375, -1.67840576171875, -1.553009033203125, -1.4276123046875, -1.302215576171875, -1.17681884765625, -1.051422119140625, -0.926025390625, -0.800628662109375, -0.67523193359375, -0.549835205078125, -0.4244384765625, -0.299041748046875, -0.17364501953125, -0.048248291015625, 0.0771484375, 0.202545166015625, 0.32794189453125, 0.453338623046875, 0.5787353515625, 0.704132080078125, 0.82952880859375, 0.954925537109375, 1.080322265625, 1.205718994140625, 1.33111572265625, 1.456512451171875, 1.5819091796875, 1.707305908203125, 1.83270263671875, 1.958099365234375, 2.08349609375, 2.208892822265625, 2.33428955078125, 2.459686279296875, 2.5850830078125, 2.710479736328125, 2.83587646484375, 2.961273193359375, 3.086669921875, 3.212066650390625, 3.33746337890625, 3.462860107421875, 3.5882568359375, 3.713653564453125, 3.83905029296875, 3.964447021484375, 4.08984375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 7.0, 7.0, 9.0, 14.0, 10.0, 19.0, 24.0, 28.0, 25.0, 34.0, 36.0, 61.0, 75.0, 100.0, 129.0, 179.0, 236.0, 258.0, 340.0, 599.0, 25928.0, 4161698.0, 2541.0, 438.0, 319.0, 251.0, 214.0, 152.0, 101.0, 92.0, 58.0, 52.0, 51.0, 30.0, 31.0, 25.0, 21.0, 13.0, 13.0, 8.0, 10.0, 11.0, 6.0, 6.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-40.53125, -39.150390625, -37.76953125, -36.388671875, -35.0078125, -33.626953125, -32.24609375, -30.865234375, -29.484375, -28.103515625, -26.72265625, -25.341796875, -23.9609375, -22.580078125, -21.19921875, -19.818359375, -18.4375, -17.056640625, -15.67578125, -14.294921875, -12.9140625, -11.533203125, -10.15234375, -8.771484375, -7.390625, -6.009765625, -4.62890625, -3.248046875, -1.8671875, -0.486328125, 0.89453125, 2.275390625, 3.65625, 5.037109375, 6.41796875, 7.798828125, 9.1796875, 10.560546875, 11.94140625, 13.322265625, 14.703125, 16.083984375, 17.46484375, 18.845703125, 20.2265625, 21.607421875, 22.98828125, 24.369140625, 25.75, 27.130859375, 28.51171875, 29.892578125, 31.2734375, 32.654296875, 34.03515625, 35.416015625, 36.796875, 38.177734375, 39.55859375, 40.939453125, 42.3203125, 43.701171875, 45.08203125, 46.462890625, 47.84375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 3.0, 10.0, 12.0, 9.0, 22.0, 28.0, 40.0, 62.0, 85.0, 134.0, 164.0, 241.0, 374.0, 496.0, 593.0, 565.0, 371.0, 242.0, 162.0, 122.0, 100.0, 48.0, 47.0, 39.0, 18.0, 26.0, 9.0, 13.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.61328125, -5.4095458984375, -5.205810546875, -5.0020751953125, -4.79833984375, -4.5946044921875, -4.390869140625, -4.1871337890625, -3.9833984375, -3.7796630859375, -3.575927734375, -3.3721923828125, -3.16845703125, -2.9647216796875, -2.760986328125, -2.5572509765625, -2.353515625, -2.1497802734375, -1.946044921875, -1.7423095703125, -1.53857421875, -1.3348388671875, -1.131103515625, -0.9273681640625, -0.7236328125, -0.5198974609375, -0.316162109375, -0.1124267578125, 0.09130859375, 0.2950439453125, 0.498779296875, 0.7025146484375, 0.90625, 1.1099853515625, 1.313720703125, 1.5174560546875, 1.72119140625, 1.9249267578125, 2.128662109375, 2.3323974609375, 2.5361328125, 2.7398681640625, 2.943603515625, 3.1473388671875, 3.35107421875, 3.5548095703125, 3.758544921875, 3.9622802734375, 4.166015625, 4.3697509765625, 4.573486328125, 4.7772216796875, 4.98095703125, 5.1846923828125, 5.388427734375, 5.5921630859375, 5.7958984375, 5.9996337890625, 6.203369140625, 6.4071044921875, 6.61083984375, 6.8145751953125, 7.018310546875, 7.2220458984375, 7.42578125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 3.0, 15.0, 17.0, 10.0, 17.0, 35.0, 46.0, 53.0, 77.0, 104.0, 224.0, 789.0, 27606.0, 4117399.0, 46294.0, 955.0, 222.0, 95.0, 63.0, 69.0, 43.0, 29.0, 22.0, 18.0, 15.0, 9.0, 11.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.5, -38.44775390625, -37.3955078125, -36.34326171875, -35.291015625, -34.23876953125, -33.1865234375, -32.13427734375, -31.08203125, -30.02978515625, -28.9775390625, -27.92529296875, -26.873046875, -25.82080078125, -24.7685546875, -23.71630859375, -22.6640625, -21.61181640625, -20.5595703125, -19.50732421875, -18.455078125, -17.40283203125, -16.3505859375, -15.29833984375, -14.24609375, -13.19384765625, -12.1416015625, -11.08935546875, -10.037109375, -8.98486328125, -7.9326171875, -6.88037109375, -5.828125, -4.77587890625, -3.7236328125, -2.67138671875, -1.619140625, -0.56689453125, 0.4853515625, 1.53759765625, 2.58984375, 3.64208984375, 4.6943359375, 5.74658203125, 6.798828125, 7.85107421875, 8.9033203125, 9.95556640625, 11.0078125, 12.06005859375, 13.1123046875, 14.16455078125, 15.216796875, 16.26904296875, 17.3212890625, 18.37353515625, 19.42578125, 20.47802734375, 21.5302734375, 22.58251953125, 23.634765625, 24.68701171875, 25.7392578125, 26.79150390625, 27.84375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 142.0, 685.0, 175.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-213.35162353515625, -209.44268798828125, -205.53375244140625, -201.6248016357422, -197.7158660888672, -193.8069305419922, -189.89797973632812, -185.98904418945312, -182.08010864257812, -178.17117309570312, -174.26223754882812, -170.35328674316406, -166.44435119628906, -162.53541564941406, -158.62646484375, -154.717529296875, -150.80859375, -146.899658203125, -142.99072265625, -139.08177185058594, -135.17283630371094, -131.26390075683594, -127.3549575805664, -123.44601440429688, -119.53707885742188, -115.62814331054688, -111.71920013427734, -107.81025695800781, -103.90132141113281, -99.99238586425781, -96.08344268798828, -92.17449951171875, -88.26556396484375, -84.35662841796875, -80.44768524169922, -76.53874206542969, -72.62980651855469, -68.72087097167969, -64.81192779541016, -60.90298843383789, -56.994049072265625, -53.08510971069336, -49.176170349121094, -45.26723098754883, -41.35829162597656, -37.4493522644043, -33.54041290283203, -29.631473541259766, -25.7225341796875, -21.813594818115234, -17.90465545654297, -13.995716094970703, -10.086776733398438, -6.177837371826172, -2.2688980102539062, 1.6400413513183594, 5.548980712890625, 9.45792007446289, 13.366859436035156, 17.275798797607422, 21.184738159179688, 25.093677520751953, 29.00261688232422, 32.911556243896484, 36.82049560546875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 7.0, 3.0, 11.0, 11.0, 14.0, 12.0, 11.0, 16.0, 22.0, 27.0, 26.0, 32.0, 38.0, 45.0, 32.0, 36.0, 52.0, 56.0, 42.0, 41.0, 44.0, 47.0, 44.0, 40.0, 45.0, 21.0, 27.0, 29.0, 27.0, 24.0, 23.0, 15.0, 18.0, 10.0, 10.0, 8.0, 10.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.761035919189453, -19.073503494262695, -18.385971069335938, -17.69843864440918, -17.010906219482422, -16.323373794555664, -15.635842323303223, -14.948309898376465, -14.260777473449707, -13.57324504852295, -12.885712623596191, -12.19818115234375, -11.510648727416992, -10.823116302490234, -10.135583877563477, -9.448051452636719, -8.760519027709961, -8.072986602783203, -7.385454177856445, -6.697922229766846, -6.010389804840088, -5.32285737991333, -4.6353254318237305, -3.9477930068969727, -3.260260581970215, -2.572728157043457, -1.8851959705352783, -1.1976637840270996, -0.5101313591003418, 0.17740106582641602, 0.8649330139160156, 1.5524654388427734, 2.2399978637695312, 2.927530288696289, 3.6150624752044678, 4.3025946617126465, 4.990127086639404, 5.677659511566162, 6.365191459655762, 7.0527238845825195, 7.740256309509277, 8.427788734436035, 9.115321159362793, 9.802852630615234, 10.490385055541992, 11.17791748046875, 11.865449905395508, 12.552982330322266, 13.240514755249023, 13.928047180175781, 14.615579605102539, 15.303112030029297, 15.990644454956055, 16.678176879882812, 17.365707397460938, 18.053241729736328, 18.740772247314453, 19.42830467224121, 20.11583709716797, 20.803369522094727, 21.490901947021484, 22.178434371948242, 22.865966796875, 23.553497314453125, 24.241031646728516]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 8.0, 19.0, 11.0, 14.0, 15.0, 25.0, 26.0, 22.0, 26.0, 30.0, 29.0, 33.0, 47.0, 41.0, 39.0, 60.0, 47.0, 40.0, 48.0, 39.0, 52.0, 31.0, 40.0, 35.0, 33.0, 33.0, 24.0, 23.0, 21.0, 14.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.0982666015625, -2.973876953125, -2.8494873046875, -2.72509765625, -2.6007080078125, -2.476318359375, -2.3519287109375, -2.2275390625, -2.1031494140625, -1.978759765625, -1.8543701171875, -1.72998046875, -1.6055908203125, -1.481201171875, -1.3568115234375, -1.232421875, -1.1080322265625, -0.983642578125, -0.8592529296875, -0.73486328125, -0.6104736328125, -0.486083984375, -0.3616943359375, -0.2373046875, -0.1129150390625, 0.011474609375, 0.1358642578125, 0.26025390625, 0.3846435546875, 0.509033203125, 0.6334228515625, 0.7578125, 0.8822021484375, 1.006591796875, 1.1309814453125, 1.25537109375, 1.3797607421875, 1.504150390625, 1.6285400390625, 1.7529296875, 1.8773193359375, 2.001708984375, 2.1260986328125, 2.25048828125, 2.3748779296875, 2.499267578125, 2.6236572265625, 2.748046875, 2.8724365234375, 2.996826171875, 3.1212158203125, 3.24560546875, 3.3699951171875, 3.494384765625, 3.6187744140625, 3.7431640625, 3.8675537109375, 3.991943359375, 4.1163330078125, 4.24072265625, 4.3651123046875, 4.489501953125, 4.6138916015625, 4.73828125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 11.0, 15.0, 22.0, 22.0, 45.0, 55.0, 101.0, 138.0, 199.0, 344.0, 491.0, 831.0, 1196.0, 1979.0, 3070.0, 5110.0, 8209.0, 13514.0, 22336.0, 39223.0, 73963.0, 152494.0, 319746.0, 197485.0, 92267.0, 47844.0, 26828.0, 15707.0, 9450.0, 5811.0, 3616.0, 2281.0, 1464.0, 959.0, 646.0, 402.0, 245.0, 127.0, 112.0, 69.0, 54.0, 16.0, 20.0, 14.0, 13.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.796875, -0.7724761962890625, -0.748077392578125, -0.7236785888671875, -0.69927978515625, -0.6748809814453125, -0.650482177734375, -0.6260833740234375, -0.6016845703125, -0.5772857666015625, -0.552886962890625, -0.5284881591796875, -0.50408935546875, -0.4796905517578125, -0.455291748046875, -0.4308929443359375, -0.406494140625, -0.3820953369140625, -0.357696533203125, -0.3332977294921875, -0.30889892578125, -0.2845001220703125, -0.260101318359375, -0.2357025146484375, -0.2113037109375, -0.1869049072265625, -0.162506103515625, -0.1381072998046875, -0.11370849609375, -0.0893096923828125, -0.064910888671875, -0.0405120849609375, -0.01611328125, 0.0082855224609375, 0.032684326171875, 0.0570831298828125, 0.08148193359375, 0.1058807373046875, 0.130279541015625, 0.1546783447265625, 0.1790771484375, 0.2034759521484375, 0.227874755859375, 0.2522735595703125, 0.27667236328125, 0.3010711669921875, 0.325469970703125, 0.3498687744140625, 0.374267578125, 0.3986663818359375, 0.423065185546875, 0.4474639892578125, 0.47186279296875, 0.4962615966796875, 0.520660400390625, 0.5450592041015625, 0.5694580078125, 0.5938568115234375, 0.618255615234375, 0.6426544189453125, 0.66705322265625, 0.6914520263671875, 0.715850830078125, 0.7402496337890625, 0.7646484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 7.0, 8.0, 9.0, 11.0, 11.0, 13.0, 14.0, 23.0, 16.0, 18.0, 24.0, 21.0, 32.0, 25.0, 27.0, 44.0, 35.0, 38.0, 40.0, 50.0, 1067.0, 61.0, 38.0, 39.0, 41.0, 35.0, 36.0, 37.0, 23.0, 18.0, 21.0, 23.0, 23.0, 20.0, 12.0, 14.0, 6.0, 10.0, 7.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.2471923828125, -2.174072265625, -2.1009521484375, -2.02783203125, -1.9547119140625, -1.881591796875, -1.8084716796875, -1.7353515625, -1.6622314453125, -1.589111328125, -1.5159912109375, -1.44287109375, -1.3697509765625, -1.296630859375, -1.2235107421875, -1.150390625, -1.0772705078125, -1.004150390625, -0.9310302734375, -0.85791015625, -0.7847900390625, -0.711669921875, -0.6385498046875, -0.5654296875, -0.4923095703125, -0.419189453125, -0.3460693359375, -0.27294921875, -0.1998291015625, -0.126708984375, -0.0535888671875, 0.01953125, 0.0926513671875, 0.165771484375, 0.2388916015625, 0.31201171875, 0.3851318359375, 0.458251953125, 0.5313720703125, 0.6044921875, 0.6776123046875, 0.750732421875, 0.8238525390625, 0.89697265625, 0.9700927734375, 1.043212890625, 1.1163330078125, 1.189453125, 1.2625732421875, 1.335693359375, 1.4088134765625, 1.48193359375, 1.5550537109375, 1.628173828125, 1.7012939453125, 1.7744140625, 1.8475341796875, 1.920654296875, 1.9937744140625, 2.06689453125, 2.1400146484375, 2.213134765625, 2.2862548828125, 2.359375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 14.0, 32.0, 42.0, 59.0, 84.0, 136.0, 218.0, 319.0, 469.0, 659.0, 1035.0, 1457.0, 2113.0, 3105.0, 4614.0, 7044.0, 10474.0, 16266.0, 25365.0, 41641.0, 72567.0, 143572.0, 1354955.0, 187743.0, 88379.0, 49409.0, 29877.0, 18768.0, 12129.0, 8035.0, 5419.0, 3652.0, 2514.0, 1667.0, 1079.0, 747.0, 473.0, 333.0, 224.0, 136.0, 92.0, 64.0, 54.0, 27.0, 20.0, 20.0, 9.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.63671875, -0.616607666015625, -0.59649658203125, -0.576385498046875, -0.5562744140625, -0.536163330078125, -0.51605224609375, -0.495941162109375, -0.475830078125, -0.455718994140625, -0.43560791015625, -0.415496826171875, -0.3953857421875, -0.375274658203125, -0.35516357421875, -0.335052490234375, -0.31494140625, -0.294830322265625, -0.27471923828125, -0.254608154296875, -0.2344970703125, -0.214385986328125, -0.19427490234375, -0.174163818359375, -0.154052734375, -0.133941650390625, -0.11383056640625, -0.093719482421875, -0.0736083984375, -0.053497314453125, -0.03338623046875, -0.013275146484375, 0.0068359375, 0.026947021484375, 0.04705810546875, 0.067169189453125, 0.0872802734375, 0.107391357421875, 0.12750244140625, 0.147613525390625, 0.167724609375, 0.187835693359375, 0.20794677734375, 0.228057861328125, 0.2481689453125, 0.268280029296875, 0.28839111328125, 0.308502197265625, 0.32861328125, 0.348724365234375, 0.36883544921875, 0.388946533203125, 0.4090576171875, 0.429168701171875, 0.44927978515625, 0.469390869140625, 0.489501953125, 0.509613037109375, 0.52972412109375, 0.549835205078125, 0.5699462890625, 0.590057373046875, 0.61016845703125, 0.630279541015625, 0.650390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 12.0, 7.0, 16.0, 20.0, 24.0, 29.0, 35.0, 37.0, 37.0, 44.0, 50.0, 78.0, 67.0, 68.0, 69.0, 56.0, 48.0, 34.0, 36.0, 37.0, 35.0, 29.0, 20.0, 24.0, 14.0, 8.0, 12.0, 8.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00043845176696777344, -0.0004248395562171936, -0.00041122734546661377, -0.00039761513471603394, -0.0003840029239654541, -0.00037039071321487427, -0.00035677850246429443, -0.0003431662917137146, -0.00032955408096313477, -0.00031594187021255493, -0.0003023296594619751, -0.00028871744871139526, -0.00027510523796081543, -0.0002614930272102356, -0.00024788081645965576, -0.00023426860570907593, -0.0002206563949584961, -0.00020704418420791626, -0.00019343197345733643, -0.0001798197627067566, -0.00016620755195617676, -0.00015259534120559692, -0.0001389831304550171, -0.00012537091970443726, -0.00011175870895385742, -9.814649820327759e-05, -8.453428745269775e-05, -7.092207670211792e-05, -5.7309865951538086e-05, -4.369765520095825e-05, -3.0085444450378418e-05, -1.6473233699798584e-05, -2.86102294921875e-06, 1.0751187801361084e-05, 2.4363398551940918e-05, 3.797560930252075e-05, 5.1587820053100586e-05, 6.520003080368042e-05, 7.881224155426025e-05, 9.242445230484009e-05, 0.00010603666305541992, 0.00011964887380599976, 0.0001332610845565796, 0.00014687329530715942, 0.00016048550605773926, 0.0001740977168083191, 0.00018770992755889893, 0.00020132213830947876, 0.0002149343490600586, 0.00022854655981063843, 0.00024215877056121826, 0.0002557709813117981, 0.00026938319206237793, 0.00028299540281295776, 0.0002966076135635376, 0.00031021982431411743, 0.00032383203506469727, 0.0003374442458152771, 0.00035105645656585693, 0.00036466866731643677, 0.0003782808780670166, 0.00039189308881759644, 0.00040550529956817627, 0.0004191175103187561, 0.00043272972106933594]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 8.0, 5.0, 11.0, 12.0, 9.0, 14.0, 28.0, 31.0, 33.0, 56.0, 67.0, 74.0, 83.0, 124.0, 181.0, 329.0, 524.0, 875.0, 3530.0, 1000709.0, 38818.0, 1150.0, 639.0, 365.0, 235.0, 161.0, 106.0, 91.0, 49.0, 52.0, 52.0, 21.0, 16.0, 23.0, 14.0, 12.0, 7.0, 5.0, 3.0, 5.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00760650634765625, -0.007373809814453125, -0.00714111328125, -0.006908416748046875, -0.00667572021484375, -0.006443023681640625, -0.0062103271484375, -0.005977630615234375, -0.00574493408203125, -0.005512237548828125, -0.005279541015625, -0.005046844482421875, -0.00481414794921875, -0.004581451416015625, -0.0043487548828125, -0.004116058349609375, -0.00388336181640625, -0.003650665283203125, -0.00341796875, -0.003185272216796875, -0.00295257568359375, -0.002719879150390625, -0.0024871826171875, -0.002254486083984375, -0.00202178955078125, -0.001789093017578125, -0.001556396484375, -0.001323699951171875, -0.00109100341796875, -0.000858306884765625, -0.0006256103515625, -0.000392913818359375, -0.00016021728515625, 7.2479248046875e-05, 0.00030517578125, 0.000537872314453125, 0.00077056884765625, 0.001003265380859375, 0.0012359619140625, 0.001468658447265625, 0.00170135498046875, 0.001934051513671875, 0.002166748046875, 0.002399444580078125, 0.00263214111328125, 0.002864837646484375, 0.0030975341796875, 0.003330230712890625, 0.00356292724609375, 0.003795623779296875, 0.0040283203125, 0.004261016845703125, 0.00449371337890625, 0.004726409912109375, 0.0049591064453125, 0.005191802978515625, 0.00542449951171875, 0.005657196044921875, 0.005889892578125, 0.006122589111328125, 0.00635528564453125, 0.006587982177734375, 0.0068206787109375, 0.007053375244140625, 0.00728607177734375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 14.0, 372.0, 565.0, 60.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002532385056838393, -0.0024828817695379257, -0.0024333782494068146, -0.002383874962106347, -0.002334371441975236, -0.0022848681546747684, -0.0022353646345436573, -0.00218586134724319, -0.0021363578271120787, -0.002086854539811611, -0.0020373510196805, -0.0019878477323800325, -0.0019383442122489214, -0.001888840808533132, -0.0018393374048173428, -0.0017898340011015534, -0.0017403305973857641, -0.0016908271936699748, -0.0016413237899541855, -0.0015918203862383962, -0.0015423169825226068, -0.0014928135788068175, -0.0014433101750910282, -0.001393806771375239, -0.0013443034840747714, -0.001294800080358982, -0.0012452966766431928, -0.0011957932729274035, -0.0011462898692116141, -0.0010967864654958248, -0.0010472830617800355, -0.0009977796580642462, -0.0009482763125561178, -0.0008987729088403285, -0.0008492695051245391, -0.0007997661014087498, -0.0007502626976929605, -0.0007007593521848321, -0.0006512559484690428, -0.0006017525447532535, -0.0005522491410374641, -0.0005027457373216748, -0.0004532423336058855, -0.0004037389298900962, -0.00035423552617430687, -0.000304732151562348, -0.0002552287478465587, -0.00020572534413076937, -0.0001562219113111496, -0.00010671850759536028, -5.7215111155528575e-05, -7.711714715696871e-06, 4.179168900009245e-05, 9.129507816396654e-05, 0.00014079848187975585, 0.00019030188559554517, 0.0002398052893113345, 0.0002893086930271238, 0.0003388120967429131, 0.000388315471354872, 0.0004378188750706613, 0.0004873222787864506, 0.0005368256825022399, 0.0005863290862180293, 0.0006358324899338186]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 10.0, 8.0, 7.0, 12.0, 18.0, 13.0, 16.0, 26.0, 18.0, 41.0, 32.0, 35.0, 34.0, 43.0, 40.0, 46.0, 43.0, 41.0, 43.0, 40.0, 44.0, 46.0, 37.0, 50.0, 36.0, 44.0, 31.0, 19.0, 28.0, 9.0, 11.0, 12.0, 12.0, 11.0, 7.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022596120834350586, -0.00021848827600479126, -0.00021101534366607666, -0.00020354241132736206, -0.00019606947898864746, -0.00018859654664993286, -0.00018112361431121826, -0.00017365068197250366, -0.00016617774963378906, -0.00015870481729507446, -0.00015123188495635986, -0.00014375895261764526, -0.00013628602027893066, -0.00012881308794021606, -0.00012134015560150146, -0.00011386722326278687, -0.00010639429092407227, -9.892135858535767e-05, -9.144842624664307e-05, -8.397549390792847e-05, -7.650256156921387e-05, -6.902962923049927e-05, -6.155669689178467e-05, -5.408376455307007e-05, -4.661083221435547e-05, -3.913789987564087e-05, -3.166496753692627e-05, -2.419203519821167e-05, -1.671910285949707e-05, -9.24617052078247e-06, -1.773238182067871e-06, 5.6996941566467285e-06, 1.3172626495361328e-05, 2.0645558834075928e-05, 2.8118491172790527e-05, 3.559142351150513e-05, 4.3064355850219727e-05, 5.0537288188934326e-05, 5.8010220527648926e-05, 6.548315286636353e-05, 7.295608520507812e-05, 8.042901754379272e-05, 8.790194988250732e-05, 9.537488222122192e-05, 0.00010284781455993652, 0.00011032074689865112, 0.00011779367923736572, 0.00012526661157608032, 0.00013273954391479492, 0.00014021247625350952, 0.00014768540859222412, 0.00015515834093093872, 0.00016263127326965332, 0.00017010420560836792, 0.00017757713794708252, 0.00018505007028579712, 0.00019252300262451172, 0.00019999593496322632, 0.00020746886730194092, 0.00021494179964065552, 0.00022241473197937012, 0.00022988766431808472, 0.00023736059665679932, 0.0002448335289955139, 0.0002523064613342285]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 8.0, 19.0, 11.0, 14.0, 15.0, 25.0, 26.0, 22.0, 26.0, 30.0, 29.0, 33.0, 47.0, 41.0, 39.0, 60.0, 47.0, 40.0, 48.0, 39.0, 52.0, 31.0, 40.0, 35.0, 33.0, 33.0, 24.0, 23.0, 21.0, 14.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.0982666015625, -2.973876953125, -2.8494873046875, -2.72509765625, -2.6007080078125, -2.476318359375, -2.3519287109375, -2.2275390625, -2.1031494140625, -1.978759765625, -1.8543701171875, -1.72998046875, -1.6055908203125, -1.481201171875, -1.3568115234375, -1.232421875, -1.1080322265625, -0.983642578125, -0.8592529296875, -0.73486328125, -0.6104736328125, -0.486083984375, -0.3616943359375, -0.2373046875, -0.1129150390625, 0.011474609375, 0.1358642578125, 0.26025390625, 0.3846435546875, 0.509033203125, 0.6334228515625, 0.7578125, 0.8822021484375, 1.006591796875, 1.1309814453125, 1.25537109375, 1.3797607421875, 1.504150390625, 1.6285400390625, 1.7529296875, 1.8773193359375, 2.001708984375, 2.1260986328125, 2.25048828125, 2.3748779296875, 2.499267578125, 2.6236572265625, 2.748046875, 2.8724365234375, 2.996826171875, 3.1212158203125, 3.24560546875, 3.3699951171875, 3.494384765625, 3.6187744140625, 3.7431640625, 3.8675537109375, 3.991943359375, 4.1163330078125, 4.24072265625, 4.3651123046875, 4.489501953125, 4.6138916015625, 4.73828125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 7.0, 9.0, 15.0, 26.0, 32.0, 48.0, 70.0, 95.0, 123.0, 167.0, 237.0, 338.0, 496.0, 739.0, 1094.0, 1665.0, 3382.0, 19995.0, 203257.0, 643476.0, 151008.0, 14445.0, 2866.0, 1548.0, 1069.0, 666.0, 514.0, 339.0, 224.0, 163.0, 140.0, 83.0, 64.0, 41.0, 28.0, 18.0, 14.0, 11.0, 7.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0546875, -8.7666015625, -8.478515625, -8.1904296875, -7.90234375, -7.6142578125, -7.326171875, -7.0380859375, -6.75, -6.4619140625, -6.173828125, -5.8857421875, -5.59765625, -5.3095703125, -5.021484375, -4.7333984375, -4.4453125, -4.1572265625, -3.869140625, -3.5810546875, -3.29296875, -3.0048828125, -2.716796875, -2.4287109375, -2.140625, -1.8525390625, -1.564453125, -1.2763671875, -0.98828125, -0.7001953125, -0.412109375, -0.1240234375, 0.1640625, 0.4521484375, 0.740234375, 1.0283203125, 1.31640625, 1.6044921875, 1.892578125, 2.1806640625, 2.46875, 2.7568359375, 3.044921875, 3.3330078125, 3.62109375, 3.9091796875, 4.197265625, 4.4853515625, 4.7734375, 5.0615234375, 5.349609375, 5.6376953125, 5.92578125, 6.2138671875, 6.501953125, 6.7900390625, 7.078125, 7.3662109375, 7.654296875, 7.9423828125, 8.23046875, 8.5185546875, 8.806640625, 9.0947265625, 9.3828125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 6.0, 3.0, 14.0, 13.0, 25.0, 22.0, 25.0, 31.0, 35.0, 35.0, 49.0, 41.0, 56.0, 99.0, 187.0, 1383.0, 357.0, 166.0, 74.0, 54.0, 45.0, 43.0, 43.0, 33.0, 33.0, 33.0, 18.0, 20.0, 24.0, 16.0, 11.0, 13.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.93359375, -8.625, -8.31640625, -8.0078125, -7.69921875, -7.390625, -7.08203125, -6.7734375, -6.46484375, -6.15625, -5.84765625, -5.5390625, -5.23046875, -4.921875, -4.61328125, -4.3046875, -3.99609375, -3.6875, -3.37890625, -3.0703125, -2.76171875, -2.453125, -2.14453125, -1.8359375, -1.52734375, -1.21875, -0.91015625, -0.6015625, -0.29296875, 0.015625, 0.32421875, 0.6328125, 0.94140625, 1.25, 1.55859375, 1.8671875, 2.17578125, 2.484375, 2.79296875, 3.1015625, 3.41015625, 3.71875, 4.02734375, 4.3359375, 4.64453125, 4.953125, 5.26171875, 5.5703125, 5.87890625, 6.1875, 6.49609375, 6.8046875, 7.11328125, 7.421875, 7.73046875, 8.0390625, 8.34765625, 8.65625, 8.96484375, 9.2734375, 9.58203125, 9.890625, 10.19921875, 10.5078125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 6.0, 13.0, 15.0, 12.0, 13.0, 28.0, 48.0, 39.0, 73.0, 85.0, 124.0, 212.0, 326.0, 503.0, 983.0, 2631.0, 3111534.0, 25656.0, 1534.0, 678.0, 390.0, 252.0, 161.0, 114.0, 70.0, 45.0, 33.0, 31.0, 26.0, 17.0, 12.0, 11.0, 4.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.375, -41.86669921875, -40.3583984375, -38.85009765625, -37.341796875, -35.83349609375, -34.3251953125, -32.81689453125, -31.30859375, -29.80029296875, -28.2919921875, -26.78369140625, -25.275390625, -23.76708984375, -22.2587890625, -20.75048828125, -19.2421875, -17.73388671875, -16.2255859375, -14.71728515625, -13.208984375, -11.70068359375, -10.1923828125, -8.68408203125, -7.17578125, -5.66748046875, -4.1591796875, -2.65087890625, -1.142578125, 0.36572265625, 1.8740234375, 3.38232421875, 4.890625, 6.39892578125, 7.9072265625, 9.41552734375, 10.923828125, 12.43212890625, 13.9404296875, 15.44873046875, 16.95703125, 18.46533203125, 19.9736328125, 21.48193359375, 22.990234375, 24.49853515625, 26.0068359375, 27.51513671875, 29.0234375, 30.53173828125, 32.0400390625, 33.54833984375, 35.056640625, 36.56494140625, 38.0732421875, 39.58154296875, 41.08984375, 42.59814453125, 44.1064453125, 45.61474609375, 47.123046875, 48.63134765625, 50.1396484375, 51.64794921875, 53.15625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 96.0, 623.0, 277.0, 16.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.67234802246094, -92.65572357177734, -89.63909912109375, -86.62247467041016, -83.60585021972656, -80.58922576904297, -77.57260131835938, -74.55597686767578, -71.53935241699219, -68.5227279663086, -65.506103515625, -62.489479064941406, -59.47285461425781, -56.45623016357422, -53.439605712890625, -50.42298126220703, -47.40635681152344, -44.389732360839844, -41.37310791015625, -38.356483459472656, -35.33985900878906, -32.32323455810547, -29.306610107421875, -26.28998565673828, -23.273361206054688, -20.256736755371094, -17.2401123046875, -14.223487854003906, -11.206863403320312, -8.190238952636719, -5.173614501953125, -2.1569900512695312, 0.8596343994140625, 3.8762588500976562, 6.89288330078125, 9.909507751464844, 12.926132202148438, 15.942756652832031, 18.959381103515625, 21.97600555419922, 24.992630004882812, 28.009254455566406, 31.02587890625, 34.042503356933594, 37.05912780761719, 40.07575225830078, 43.092376708984375, 46.10900115966797, 49.12562561035156, 52.142250061035156, 55.15887451171875, 58.175498962402344, 61.19212341308594, 64.20874786376953, 67.22537231445312, 70.24199676513672, 73.25862121582031, 76.2752456665039, 79.2918701171875, 82.3084945678711, 85.32511901855469, 88.34174346923828, 91.35836791992188, 94.37499237060547, 97.39161682128906]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 11.0, 7.0, 8.0, 12.0, 6.0, 13.0, 14.0, 12.0, 15.0, 20.0, 15.0, 22.0, 20.0, 31.0, 34.0, 27.0, 33.0, 38.0, 33.0, 40.0, 38.0, 32.0, 48.0, 37.0, 33.0, 36.0, 32.0, 39.0, 24.0, 28.0, 20.0, 19.0, 20.0, 26.0, 14.0, 20.0, 13.0, 22.0, 15.0, 14.0, 9.0, 13.0, 10.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.73282241821289, -19.054611206054688, -18.376399993896484, -17.69818878173828, -17.01997947692871, -16.341768264770508, -15.663557052612305, -14.985345840454102, -14.307135581970215, -13.628924369812012, -12.950714111328125, -12.272502899169922, -11.594291687011719, -10.916081428527832, -10.237870216369629, -9.559659957885742, -8.881448745727539, -8.203237533569336, -7.525027275085449, -6.846816062927246, -6.168605327606201, -5.490394592285156, -4.812183380126953, -4.133972644805908, -3.4557619094848633, -2.7775511741638184, -2.0993402004241943, -1.4211292266845703, -0.7429184913635254, -0.06470775604248047, 0.6135034561157227, 1.2917141914367676, 1.9699249267578125, 2.6481356620788574, 3.3263466358184814, 4.0045576095581055, 4.68276834487915, 5.360979080200195, 6.039190292358398, 6.717401027679443, 7.395611763000488, 8.073822975158691, 8.752033233642578, 9.430244445800781, 10.108455657958984, 10.786665916442871, 11.464877128601074, 12.143087387084961, 12.821298599243164, 13.499509811401367, 14.177720069885254, 14.855931282043457, 15.534141540527344, 16.212352752685547, 16.89056396484375, 17.568775177001953, 18.246986389160156, 18.92519760131836, 19.603408813476562, 20.281620025634766, 20.959829330444336, 21.63804054260254, 22.316251754760742, 22.994462966918945, 23.672672271728516]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 8.0, 12.0, 10.0, 14.0, 15.0, 26.0, 23.0, 20.0, 16.0, 29.0, 31.0, 44.0, 35.0, 30.0, 37.0, 41.0, 32.0, 41.0, 37.0, 38.0, 61.0, 24.0, 36.0, 37.0, 31.0, 34.0, 35.0, 23.0, 25.0, 20.0, 22.0, 19.0, 8.0, 9.0, 7.0, 6.0, 5.0, 3.0, 8.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.482421875, -3.370849609375, -3.25927734375, -3.147705078125, -3.0361328125, -2.924560546875, -2.81298828125, -2.701416015625, -2.58984375, -2.478271484375, -2.36669921875, -2.255126953125, -2.1435546875, -2.031982421875, -1.92041015625, -1.808837890625, -1.697265625, -1.585693359375, -1.47412109375, -1.362548828125, -1.2509765625, -1.139404296875, -1.02783203125, -0.916259765625, -0.8046875, -0.693115234375, -0.58154296875, -0.469970703125, -0.3583984375, -0.246826171875, -0.13525390625, -0.023681640625, 0.087890625, 0.199462890625, 0.31103515625, 0.422607421875, 0.5341796875, 0.645751953125, 0.75732421875, 0.868896484375, 0.98046875, 1.092041015625, 1.20361328125, 1.315185546875, 1.4267578125, 1.538330078125, 1.64990234375, 1.761474609375, 1.873046875, 1.984619140625, 2.09619140625, 2.207763671875, 2.3193359375, 2.430908203125, 2.54248046875, 2.654052734375, 2.765625, 2.877197265625, 2.98876953125, 3.100341796875, 3.2119140625, 3.323486328125, 3.43505859375, 3.546630859375, 3.658203125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 8.0, 8.0, 14.0, 21.0, 23.0, 36.0, 40.0, 63.0, 70.0, 96.0, 138.0, 218.0, 345.0, 708.0, 1697.0, 4722.0, 20872.0, 132152.0, 822998.0, 2181145.0, 864629.0, 134618.0, 21203.0, 5083.0, 1576.0, 680.0, 356.0, 226.0, 128.0, 99.0, 61.0, 67.0, 33.0, 32.0, 25.0, 25.0, 14.0, 20.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.20233154296875, -4.9984130859375, -4.79449462890625, -4.590576171875, -4.38665771484375, -4.1827392578125, -3.97882080078125, -3.77490234375, -3.57098388671875, -3.3670654296875, -3.16314697265625, -2.959228515625, -2.75531005859375, -2.5513916015625, -2.34747314453125, -2.1435546875, -1.93963623046875, -1.7357177734375, -1.53179931640625, -1.327880859375, -1.12396240234375, -0.9200439453125, -0.71612548828125, -0.51220703125, -0.30828857421875, -0.1043701171875, 0.09954833984375, 0.303466796875, 0.50738525390625, 0.7113037109375, 0.91522216796875, 1.119140625, 1.32305908203125, 1.5269775390625, 1.73089599609375, 1.934814453125, 2.13873291015625, 2.3426513671875, 2.54656982421875, 2.75048828125, 2.95440673828125, 3.1583251953125, 3.36224365234375, 3.566162109375, 3.77008056640625, 3.9739990234375, 4.17791748046875, 4.3818359375, 4.58575439453125, 4.7896728515625, 4.99359130859375, 5.197509765625, 5.40142822265625, 5.6053466796875, 5.80926513671875, 6.01318359375, 6.21710205078125, 6.4210205078125, 6.62493896484375, 6.828857421875, 7.03277587890625, 7.2366943359375, 7.44061279296875, 7.64453125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 9.0, 6.0, 6.0, 8.0, 15.0, 17.0, 28.0, 26.0, 42.0, 60.0, 74.0, 102.0, 139.0, 170.0, 209.0, 304.0, 411.0, 483.0, 467.0, 379.0, 258.0, 201.0, 120.0, 112.0, 104.0, 69.0, 43.0, 37.0, 41.0, 37.0, 25.0, 26.0, 10.0, 8.0, 5.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.18121337890625, -4.9796142578125, -4.77801513671875, -4.576416015625, -4.37481689453125, -4.1732177734375, -3.97161865234375, -3.77001953125, -3.56842041015625, -3.3668212890625, -3.16522216796875, -2.963623046875, -2.76202392578125, -2.5604248046875, -2.35882568359375, -2.1572265625, -1.95562744140625, -1.7540283203125, -1.55242919921875, -1.350830078125, -1.14923095703125, -0.9476318359375, -0.74603271484375, -0.54443359375, -0.34283447265625, -0.1412353515625, 0.06036376953125, 0.261962890625, 0.46356201171875, 0.6651611328125, 0.86676025390625, 1.068359375, 1.26995849609375, 1.4715576171875, 1.67315673828125, 1.874755859375, 2.07635498046875, 2.2779541015625, 2.47955322265625, 2.68115234375, 2.88275146484375, 3.0843505859375, 3.28594970703125, 3.487548828125, 3.68914794921875, 3.8907470703125, 4.09234619140625, 4.2939453125, 4.49554443359375, 4.6971435546875, 4.89874267578125, 5.100341796875, 5.30194091796875, 5.5035400390625, 5.70513916015625, 5.90673828125, 6.10833740234375, 6.3099365234375, 6.51153564453125, 6.713134765625, 6.91473388671875, 7.1163330078125, 7.31793212890625, 7.51953125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 17.0, 29.0, 68.0, 130.0, 218.0, 453.0, 1042.0, 3322.0, 77903.0, 3900632.0, 203974.0, 4366.0, 1177.0, 467.0, 227.0, 114.0, 54.0, 33.0, 15.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.28125, -26.609130859375, -25.93701171875, -25.264892578125, -24.5927734375, -23.920654296875, -23.24853515625, -22.576416015625, -21.904296875, -21.232177734375, -20.56005859375, -19.887939453125, -19.2158203125, -18.543701171875, -17.87158203125, -17.199462890625, -16.52734375, -15.855224609375, -15.18310546875, -14.510986328125, -13.8388671875, -13.166748046875, -12.49462890625, -11.822509765625, -11.150390625, -10.478271484375, -9.80615234375, -9.134033203125, -8.4619140625, -7.789794921875, -7.11767578125, -6.445556640625, -5.7734375, -5.101318359375, -4.42919921875, -3.757080078125, -3.0849609375, -2.412841796875, -1.74072265625, -1.068603515625, -0.396484375, 0.275634765625, 0.94775390625, 1.619873046875, 2.2919921875, 2.964111328125, 3.63623046875, 4.308349609375, 4.98046875, 5.652587890625, 6.32470703125, 6.996826171875, 7.6689453125, 8.341064453125, 9.01318359375, 9.685302734375, 10.357421875, 11.029541015625, 11.70166015625, 12.373779296875, 13.0458984375, 13.718017578125, 14.39013671875, 15.062255859375, 15.734375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 21.0, 670.0, 321.0, 4.0, 1.0, 1.0, 1.0], "bins": [-442.0586853027344, -434.54180908203125, -427.0249328613281, -419.5080871582031, -411.9912109375, -404.4743347167969, -396.95745849609375, -389.44061279296875, -381.9237365722656, -374.4068603515625, -366.8899841308594, -359.3731384277344, -351.85626220703125, -344.3393859863281, -336.822509765625, -329.3056640625, -321.78875732421875, -314.2718811035156, -306.7550048828125, -299.2381591796875, -291.7212829589844, -284.20440673828125, -276.6875305175781, -269.170654296875, -261.65380859375, -254.13693237304688, -246.6200714111328, -239.1031951904297, -231.58633422851562, -224.0694580078125, -216.55258178710938, -209.0357208251953, -201.5188446044922, -194.00196838378906, -186.485107421875, -178.96823120117188, -171.4513702392578, -163.9344940185547, -156.41763305664062, -148.9007568359375, -141.38389587402344, -133.8670196533203, -126.35015869140625, -118.83328247070312, -111.31642150878906, -103.79954528808594, -96.28267669677734, -88.76580810546875, -81.24893188476562, -73.73206329345703, -66.21519470214844, -58.69832229614258, -51.181453704833984, -43.66458511352539, -36.14771270751953, -28.630844116210938, -21.11397933959961, -13.5971097946167, -6.080240249633789, 1.4366302490234375, 8.953498840332031, 16.470367431640625, 23.987239837646484, 31.504108428955078, 39.02097702026367]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 3.0, 4.0, 8.0, 4.0, 8.0, 8.0, 17.0, 12.0, 20.0, 27.0, 18.0, 34.0, 28.0, 19.0, 32.0, 38.0, 36.0, 46.0, 41.0, 40.0, 40.0, 42.0, 45.0, 36.0, 53.0, 36.0, 30.0, 38.0, 33.0, 31.0, 30.0, 25.0, 20.0, 22.0, 9.0, 16.0, 8.0, 12.0, 7.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.018861770629883, -22.141508102416992, -21.264156341552734, -20.386802673339844, -19.509449005126953, -18.632095336914062, -17.754741668701172, -16.877389907836914, -16.000036239624023, -15.122682571411133, -14.245329856872559, -13.367977142333984, -12.490623474121094, -11.613269805908203, -10.735917091369629, -9.858564376831055, -8.981210708618164, -8.103857040405273, -7.226504325866699, -6.349151134490967, -5.471797943115234, -4.594444751739502, -3.7170915603637695, -2.839738368988037, -1.9623851776123047, -1.0850319862365723, -0.20767879486083984, 0.6696743965148926, 1.547027587890625, 2.4243807792663574, 3.30173397064209, 4.179087162017822, 5.056438446044922, 5.933791637420654, 6.811144828796387, 7.688498020172119, 8.565851211547852, 9.443204879760742, 10.320557594299316, 11.19791030883789, 12.075263977050781, 12.952617645263672, 13.829970359802246, 14.70732307434082, 15.584676742553711, 16.4620304107666, 17.33938217163086, 18.21673583984375, 19.09408950805664, 19.97144317626953, 20.848796844482422, 21.72614860534668, 22.60350227355957, 23.48085594177246, 24.35820770263672, 25.23556137084961, 26.1129150390625, 26.99026870727539, 27.86762237548828, 28.74497413635254, 29.62232780456543, 30.49968147277832, 31.377033233642578, 32.25438690185547, 33.13174057006836]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 8.0, 7.0, 22.0, 19.0, 16.0, 17.0, 33.0, 28.0, 44.0, 35.0, 43.0, 44.0, 35.0, 47.0, 37.0, 39.0, 43.0, 46.0, 47.0, 48.0, 41.0, 37.0, 36.0, 31.0, 30.0, 28.0, 24.0, 19.0, 22.0, 9.0, 17.0, 18.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.120361328125, -3.01611328125, -2.911865234375, -2.8076171875, -2.703369140625, -2.59912109375, -2.494873046875, -2.390625, -2.286376953125, -2.18212890625, -2.077880859375, -1.9736328125, -1.869384765625, -1.76513671875, -1.660888671875, -1.556640625, -1.452392578125, -1.34814453125, -1.243896484375, -1.1396484375, -1.035400390625, -0.93115234375, -0.826904296875, -0.72265625, -0.618408203125, -0.51416015625, -0.409912109375, -0.3056640625, -0.201416015625, -0.09716796875, 0.007080078125, 0.111328125, 0.215576171875, 0.31982421875, 0.424072265625, 0.5283203125, 0.632568359375, 0.73681640625, 0.841064453125, 0.9453125, 1.049560546875, 1.15380859375, 1.258056640625, 1.3623046875, 1.466552734375, 1.57080078125, 1.675048828125, 1.779296875, 1.883544921875, 1.98779296875, 2.092041015625, 2.1962890625, 2.300537109375, 2.40478515625, 2.509033203125, 2.61328125, 2.717529296875, 2.82177734375, 2.926025390625, 3.0302734375, 3.134521484375, 3.23876953125, 3.343017578125, 3.447265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 22.0, 22.0, 36.0, 56.0, 81.0, 116.0, 189.0, 295.0, 469.0, 914.0, 1626.0, 2999.0, 5347.0, 10448.0, 20379.0, 39735.0, 81972.0, 197362.0, 377599.0, 164137.0, 71598.0, 34877.0, 17890.0, 9360.0, 4921.0, 2665.0, 1437.0, 830.0, 441.0, 259.0, 153.0, 103.0, 74.0, 43.0, 24.0, 18.0, 18.0, 8.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7568359375, -0.7334823608398438, -0.7101287841796875, -0.6867752075195312, -0.663421630859375, -0.6400680541992188, -0.6167144775390625, -0.5933609008789062, -0.57000732421875, -0.5466537475585938, -0.5233001708984375, -0.49994659423828125, -0.476593017578125, -0.45323944091796875, -0.4298858642578125, -0.40653228759765625, -0.3831787109375, -0.35982513427734375, -0.3364715576171875, -0.31311798095703125, -0.289764404296875, -0.26641082763671875, -0.2430572509765625, -0.21970367431640625, -0.19635009765625, -0.17299652099609375, -0.1496429443359375, -0.12628936767578125, -0.102935791015625, -0.07958221435546875, -0.0562286376953125, -0.03287506103515625, -0.009521484375, 0.01383209228515625, 0.0371856689453125, 0.06053924560546875, 0.083892822265625, 0.10724639892578125, 0.1305999755859375, 0.15395355224609375, 0.17730712890625, 0.20066070556640625, 0.2240142822265625, 0.24736785888671875, 0.270721435546875, 0.29407501220703125, 0.3174285888671875, 0.34078216552734375, 0.3641357421875, 0.38748931884765625, 0.4108428955078125, 0.43419647216796875, 0.457550048828125, 0.48090362548828125, 0.5042572021484375, 0.5276107788085938, 0.55096435546875, 0.5743179321289062, 0.5976715087890625, 0.6210250854492188, 0.644378662109375, 0.6677322387695312, 0.6910858154296875, 0.7144393920898438, 0.73779296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 10.0, 9.0, 4.0, 8.0, 13.0, 12.0, 15.0, 9.0, 23.0, 20.0, 24.0, 28.0, 31.0, 29.0, 27.0, 37.0, 33.0, 34.0, 33.0, 30.0, 43.0, 1061.0, 37.0, 36.0, 39.0, 41.0, 28.0, 30.0, 42.0, 23.0, 31.0, 22.0, 21.0, 20.0, 17.0, 15.0, 24.0, 13.0, 9.0, 8.0, 4.0, 9.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8125, -1.7574005126953125, -1.702301025390625, -1.6472015380859375, -1.59210205078125, -1.5370025634765625, -1.481903076171875, -1.4268035888671875, -1.3717041015625, -1.3166046142578125, -1.261505126953125, -1.2064056396484375, -1.15130615234375, -1.0962066650390625, -1.041107177734375, -0.9860076904296875, -0.930908203125, -0.8758087158203125, -0.820709228515625, -0.7656097412109375, -0.71051025390625, -0.6554107666015625, -0.600311279296875, -0.5452117919921875, -0.4901123046875, -0.4350128173828125, -0.379913330078125, -0.3248138427734375, -0.26971435546875, -0.2146148681640625, -0.159515380859375, -0.1044158935546875, -0.04931640625, 0.0057830810546875, 0.060882568359375, 0.1159820556640625, 0.17108154296875, 0.2261810302734375, 0.281280517578125, 0.3363800048828125, 0.3914794921875, 0.4465789794921875, 0.501678466796875, 0.5567779541015625, 0.61187744140625, 0.6669769287109375, 0.722076416015625, 0.7771759033203125, 0.832275390625, 0.8873748779296875, 0.942474365234375, 0.9975738525390625, 1.05267333984375, 1.1077728271484375, 1.162872314453125, 1.2179718017578125, 1.2730712890625, 1.3281707763671875, 1.383270263671875, 1.4383697509765625, 1.49346923828125, 1.5485687255859375, 1.603668212890625, 1.6587677001953125, 1.7138671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 28.0, 49.0, 65.0, 78.0, 138.0, 161.0, 286.0, 336.0, 520.0, 763.0, 1093.0, 1615.0, 2277.0, 3334.0, 4879.0, 7418.0, 10953.0, 17045.0, 26284.0, 42322.0, 69424.0, 124134.0, 1310190.0, 207712.0, 101709.0, 59334.0, 36393.0, 23016.0, 15004.0, 9754.0, 6582.0, 4515.0, 3013.0, 2109.0, 1421.0, 969.0, 687.0, 488.0, 319.0, 218.0, 157.0, 109.0, 59.0, 42.0, 32.0, 27.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.499755859375, -0.4845390319824219, -0.46932220458984375, -0.4541053771972656, -0.4388885498046875, -0.4236717224121094, -0.40845489501953125, -0.3932380676269531, -0.378021240234375, -0.3628044128417969, -0.34758758544921875, -0.3323707580566406, -0.3171539306640625, -0.3019371032714844, -0.28672027587890625, -0.2715034484863281, -0.25628662109375, -0.24106979370117188, -0.22585296630859375, -0.21063613891601562, -0.1954193115234375, -0.18020248413085938, -0.16498565673828125, -0.14976882934570312, -0.134552001953125, -0.11933517456054688, -0.10411834716796875, -0.08890151977539062, -0.0736846923828125, -0.058467864990234375, -0.04325103759765625, -0.028034210205078125, -0.0128173828125, 0.002399444580078125, 0.01761627197265625, 0.032833099365234375, 0.0480499267578125, 0.06326675415039062, 0.07848358154296875, 0.09370040893554688, 0.108917236328125, 0.12413406372070312, 0.13935089111328125, 0.15456771850585938, 0.1697845458984375, 0.18500137329101562, 0.20021820068359375, 0.21543502807617188, 0.23065185546875, 0.24586868286132812, 0.26108551025390625, 0.2763023376464844, 0.2915191650390625, 0.3067359924316406, 0.32195281982421875, 0.3371696472167969, 0.352386474609375, 0.3676033020019531, 0.38282012939453125, 0.3980369567871094, 0.4132537841796875, 0.4284706115722656, 0.44368743896484375, 0.4589042663574219, 0.47412109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 4.0, 9.0, 11.0, 12.0, 14.0, 11.0, 14.0, 23.0, 27.0, 22.0, 36.0, 42.0, 41.0, 45.0, 51.0, 37.0, 57.0, 57.0, 65.0, 46.0, 57.0, 49.0, 34.0, 35.0, 34.0, 25.0, 23.0, 11.0, 17.0, 14.0, 16.0, 11.0, 9.0, 7.0, 10.0, 2.0, 2.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003428459167480469, -0.00033260881900787354, -0.0003223717212677002, -0.00031213462352752686, -0.0003018975257873535, -0.0002916604280471802, -0.00028142333030700684, -0.0002711862325668335, -0.00026094913482666016, -0.0002507120370864868, -0.00024047493934631348, -0.00023023784160614014, -0.0002200007438659668, -0.00020976364612579346, -0.00019952654838562012, -0.00018928945064544678, -0.00017905235290527344, -0.0001688152551651001, -0.00015857815742492676, -0.00014834105968475342, -0.00013810396194458008, -0.00012786686420440674, -0.0001176297664642334, -0.00010739266872406006, -9.715557098388672e-05, -8.691847324371338e-05, -7.668137550354004e-05, -6.64442777633667e-05, -5.620718002319336e-05, -4.597008228302002e-05, -3.573298454284668e-05, -2.549588680267334e-05, -1.52587890625e-05, -5.02169132232666e-06, 5.21540641784668e-06, 1.545250415802002e-05, 2.568960189819336e-05, 3.59266996383667e-05, 4.616379737854004e-05, 5.640089511871338e-05, 6.663799285888672e-05, 7.687509059906006e-05, 8.71121883392334e-05, 9.734928607940674e-05, 0.00010758638381958008, 0.00011782348155975342, 0.00012806057929992676, 0.0001382976770401001, 0.00014853477478027344, 0.00015877187252044678, 0.00016900897026062012, 0.00017924606800079346, 0.0001894831657409668, 0.00019972026348114014, 0.00020995736122131348, 0.00022019445896148682, 0.00023043155670166016, 0.0002406686544418335, 0.00025090575218200684, 0.0002611428499221802, 0.0002713799476623535, 0.00028161704540252686, 0.0002918541431427002, 0.00030209124088287354, 0.0003123283386230469]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 2.0, 12.0, 11.0, 8.0, 29.0, 32.0, 30.0, 45.0, 53.0, 53.0, 50.0, 128.0, 155.0, 233.0, 327.0, 545.0, 931.0, 8711.0, 1024078.0, 10307.0, 972.0, 542.0, 363.0, 242.0, 175.0, 121.0, 78.0, 62.0, 39.0, 39.0, 26.0, 38.0, 26.0, 11.0, 18.0, 9.0, 11.0, 7.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006000518798828125, -0.005810141563415527, -0.00561976432800293, -0.005429387092590332, -0.005239009857177734, -0.005048632621765137, -0.004858255386352539, -0.004667878150939941, -0.004477500915527344, -0.004287123680114746, -0.0040967464447021484, -0.003906369209289551, -0.003715991973876953, -0.0035256147384643555, -0.003335237503051758, -0.00314486026763916, -0.0029544830322265625, -0.002764105796813965, -0.002573728561401367, -0.0023833513259887695, -0.002192974090576172, -0.0020025968551635742, -0.0018122196197509766, -0.001621842384338379, -0.0014314651489257812, -0.0012410879135131836, -0.001050710678100586, -0.0008603334426879883, -0.0006699562072753906, -0.00047957897186279297, -0.0002892017364501953, -9.882450103759766e-05, 9.1552734375e-05, 0.00028192996978759766, 0.0004723072052001953, 0.000662684440612793, 0.0008530616760253906, 0.0010434389114379883, 0.001233816146850586, 0.0014241933822631836, 0.0016145706176757812, 0.001804947853088379, 0.0019953250885009766, 0.0021857023239135742, 0.002376079559326172, 0.0025664567947387695, 0.002756834030151367, 0.002947211265563965, 0.0031375885009765625, 0.00332796573638916, 0.003518342971801758, 0.0037087202072143555, 0.003899097442626953, 0.004089474678039551, 0.0042798519134521484, 0.004470229148864746, 0.004660606384277344, 0.004850983619689941, 0.005041360855102539, 0.005231738090515137, 0.005422115325927734, 0.005612492561340332, 0.00580286979675293, 0.005993247032165527, 0.006183624267578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 22.0, 178.0, 537.0, 247.0, 28.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006031366647221148, -0.0005752437864430249, -0.0005473509663715959, -0.0005194580880925059, -0.0004915652680210769, -0.000463672389741987, -0.0004357795405667275, -0.00040788669139146805, -0.0003799938422162086, -0.0003521009930409491, -0.00032420814386568964, -0.00029631529469043016, -0.00026842241641134024, -0.000240529581787996, -0.0002126367180608213, -0.00018474386888556182, -0.00015685101971030235, -0.00012895817053504288, -0.0001010653140838258, -7.317245763260871e-05, -4.527960845734924e-05, -1.738675928208977e-05, 1.050610444508493e-05, 3.83989536203444e-05, 6.629180279560387e-05, 9.418465197086334e-05, 0.0001220775011461228, 0.0001499703648732975, 0.00017786321404855698, 0.00020575606322381645, 0.00023364892695099115, 0.0002615417761262506, 0.000289434683509171, 0.0003173275326844305, 0.00034522038185968995, 0.0003731132601387799, 0.0004010060802102089, 0.0004288989584892988, 0.0004567918076645583, 0.00048468465683981776, 0.0005125774769112468, 0.0005404703551903367, 0.0005683631752617657, 0.0005962560535408556, 0.0006241488736122847, 0.0006520417518913746, 0.0006799346301704645, 0.0007078274502418935, 0.0007357203285209835, 0.0007636132068000734, 0.0007915060268715024, 0.0008193989051505923, 0.0008472917252220213, 0.0008751846035011113, 0.0009030774235725403, 0.0009309703018516302, 0.0009588631801307201, 0.00098675605840981, 0.0010146489366889, 0.001042541698552668, 0.001070434576831758, 0.001098327455110848, 0.0011262203333899379, 0.001154113095253706, 0.001182005973532796]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 10.0, 5.0, 10.0, 11.0, 8.0, 12.0, 12.0, 24.0, 20.0, 32.0, 20.0, 29.0, 30.0, 28.0, 44.0, 31.0, 32.0, 41.0, 38.0, 44.0, 36.0, 40.0, 34.0, 37.0, 40.0, 48.0, 29.0, 29.0, 37.0, 26.0, 23.0, 21.0, 21.0, 12.0, 8.0, 14.0, 13.0, 14.0, 7.0, 9.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020492076873779297, -0.0001990925520658493, -0.00019326433539390564, -0.00018743611872196198, -0.0001816079020500183, -0.00017577968537807465, -0.00016995146870613098, -0.00016412325203418732, -0.00015829503536224365, -0.0001524668186903, -0.00014663860201835632, -0.00014081038534641266, -0.000134982168674469, -0.00012915395200252533, -0.00012332573533058167, -0.000117497518658638, -0.00011166930198669434, -0.00010584108531475067, -0.00010001286864280701, -9.418465197086334e-05, -8.835643529891968e-05, -8.252821862697601e-05, -7.670000195503235e-05, -7.087178528308868e-05, -6.504356861114502e-05, -5.9215351939201355e-05, -5.338713526725769e-05, -4.7558918595314026e-05, -4.173070192337036e-05, -3.59024852514267e-05, -3.0074268579483032e-05, -2.4246051907539368e-05, -1.8417835235595703e-05, -1.2589618563652039e-05, -6.761401891708374e-06, -9.331852197647095e-07, 4.895031452178955e-06, 1.072324812412262e-05, 1.6551464796066284e-05, 2.237968146800995e-05, 2.8207898139953613e-05, 3.403611481189728e-05, 3.986433148384094e-05, 4.569254815578461e-05, 5.152076482772827e-05, 5.7348981499671936e-05, 6.31771981716156e-05, 6.900541484355927e-05, 7.483363151550293e-05, 8.06618481874466e-05, 8.649006485939026e-05, 9.231828153133392e-05, 9.814649820327759e-05, 0.00010397471487522125, 0.00010980293154716492, 0.00011563114821910858, 0.00012145936489105225, 0.0001272875815629959, 0.00013311579823493958, 0.00013894401490688324, 0.0001447722315788269, 0.00015060044825077057, 0.00015642866492271423, 0.0001622568815946579, 0.00016808509826660156]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 8.0, 7.0, 22.0, 19.0, 16.0, 17.0, 33.0, 28.0, 44.0, 35.0, 43.0, 44.0, 35.0, 47.0, 37.0, 39.0, 43.0, 46.0, 47.0, 48.0, 41.0, 37.0, 36.0, 31.0, 30.0, 28.0, 24.0, 19.0, 22.0, 9.0, 17.0, 18.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.120361328125, -3.01611328125, -2.911865234375, -2.8076171875, -2.703369140625, -2.59912109375, -2.494873046875, -2.390625, -2.286376953125, -2.18212890625, -2.077880859375, -1.9736328125, -1.869384765625, -1.76513671875, -1.660888671875, -1.556640625, -1.452392578125, -1.34814453125, -1.243896484375, -1.1396484375, -1.035400390625, -0.93115234375, -0.826904296875, -0.72265625, -0.618408203125, -0.51416015625, -0.409912109375, -0.3056640625, -0.201416015625, -0.09716796875, 0.007080078125, 0.111328125, 0.215576171875, 0.31982421875, 0.424072265625, 0.5283203125, 0.632568359375, 0.73681640625, 0.841064453125, 0.9453125, 1.049560546875, 1.15380859375, 1.258056640625, 1.3623046875, 1.466552734375, 1.57080078125, 1.675048828125, 1.779296875, 1.883544921875, 1.98779296875, 2.092041015625, 2.1962890625, 2.300537109375, 2.40478515625, 2.509033203125, 2.61328125, 2.717529296875, 2.82177734375, 2.926025390625, 3.0302734375, 3.134521484375, 3.23876953125, 3.343017578125, 3.447265625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 10.0, 17.0, 18.0, 29.0, 45.0, 63.0, 97.0, 143.0, 173.0, 244.0, 349.0, 455.0, 707.0, 893.0, 1383.0, 2008.0, 3137.0, 5821.0, 27725.0, 362120.0, 577609.0, 47385.0, 7361.0, 3504.0, 2227.0, 1514.0, 993.0, 747.0, 506.0, 356.0, 276.0, 184.0, 154.0, 82.0, 72.0, 42.0, 34.0, 24.0, 15.0, 11.0, 0.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.75, -8.4857177734375, -8.221435546875, -7.9571533203125, -7.69287109375, -7.4285888671875, -7.164306640625, -6.9000244140625, -6.6357421875, -6.3714599609375, -6.107177734375, -5.8428955078125, -5.57861328125, -5.3143310546875, -5.050048828125, -4.7857666015625, -4.521484375, -4.2572021484375, -3.992919921875, -3.7286376953125, -3.46435546875, -3.2000732421875, -2.935791015625, -2.6715087890625, -2.4072265625, -2.1429443359375, -1.878662109375, -1.6143798828125, -1.35009765625, -1.0858154296875, -0.821533203125, -0.5572509765625, -0.29296875, -0.0286865234375, 0.235595703125, 0.4998779296875, 0.76416015625, 1.0284423828125, 1.292724609375, 1.5570068359375, 1.8212890625, 2.0855712890625, 2.349853515625, 2.6141357421875, 2.87841796875, 3.1427001953125, 3.406982421875, 3.6712646484375, 3.935546875, 4.1998291015625, 4.464111328125, 4.7283935546875, 4.99267578125, 5.2569580078125, 5.521240234375, 5.7855224609375, 6.0498046875, 6.3140869140625, 6.578369140625, 6.8426513671875, 7.10693359375, 7.3712158203125, 7.635498046875, 7.8997802734375, 8.1640625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 6.0, 9.0, 18.0, 16.0, 16.0, 31.0, 39.0, 30.0, 40.0, 56.0, 59.0, 73.0, 151.0, 1556.0, 408.0, 143.0, 59.0, 51.0, 51.0, 35.0, 34.0, 32.0, 21.0, 22.0, 17.0, 12.0, 8.0, 7.0, 7.0, 7.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.8170166015625, -9.509033203125, -9.2010498046875, -8.89306640625, -8.5850830078125, -8.277099609375, -7.9691162109375, -7.6611328125, -7.3531494140625, -7.045166015625, -6.7371826171875, -6.42919921875, -6.1212158203125, -5.813232421875, -5.5052490234375, -5.197265625, -4.8892822265625, -4.581298828125, -4.2733154296875, -3.96533203125, -3.6573486328125, -3.349365234375, -3.0413818359375, -2.7333984375, -2.4254150390625, -2.117431640625, -1.8094482421875, -1.50146484375, -1.1934814453125, -0.885498046875, -0.5775146484375, -0.26953125, 0.0384521484375, 0.346435546875, 0.6544189453125, 0.96240234375, 1.2703857421875, 1.578369140625, 1.8863525390625, 2.1943359375, 2.5023193359375, 2.810302734375, 3.1182861328125, 3.42626953125, 3.7342529296875, 4.042236328125, 4.3502197265625, 4.658203125, 4.9661865234375, 5.274169921875, 5.5821533203125, 5.89013671875, 6.1981201171875, 6.506103515625, 6.8140869140625, 7.1220703125, 7.4300537109375, 7.738037109375, 8.0460205078125, 8.35400390625, 8.6619873046875, 8.969970703125, 9.2779541015625, 9.5859375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 8.0, 3.0, 10.0, 16.0, 11.0, 29.0, 24.0, 51.0, 97.0, 129.0, 211.0, 361.0, 746.0, 2077.0, 2858284.0, 280134.0, 1874.0, 700.0, 345.0, 222.0, 108.0, 90.0, 42.0, 39.0, 26.0, 22.0, 11.0, 8.0, 4.0, 2.0, 1.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.0625, -41.6708984375, -40.279296875, -38.8876953125, -37.49609375, -36.1044921875, -34.712890625, -33.3212890625, -31.9296875, -30.5380859375, -29.146484375, -27.7548828125, -26.36328125, -24.9716796875, -23.580078125, -22.1884765625, -20.796875, -19.4052734375, -18.013671875, -16.6220703125, -15.23046875, -13.8388671875, -12.447265625, -11.0556640625, -9.6640625, -8.2724609375, -6.880859375, -5.4892578125, -4.09765625, -2.7060546875, -1.314453125, 0.0771484375, 1.46875, 2.8603515625, 4.251953125, 5.6435546875, 7.03515625, 8.4267578125, 9.818359375, 11.2099609375, 12.6015625, 13.9931640625, 15.384765625, 16.7763671875, 18.16796875, 19.5595703125, 20.951171875, 22.3427734375, 23.734375, 25.1259765625, 26.517578125, 27.9091796875, 29.30078125, 30.6923828125, 32.083984375, 33.4755859375, 34.8671875, 36.2587890625, 37.650390625, 39.0419921875, 40.43359375, 41.8251953125, 43.216796875, 44.6083984375, 46.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 181.0, 554.0, 224.0, 31.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.19784545898438, -140.66525268554688, -138.13265991210938, -135.6000518798828, -133.0674591064453, -130.5348663330078, -128.00225830078125, -125.46966552734375, -122.93707275390625, -120.40447998046875, -117.87187957763672, -115.33927917480469, -112.80668640136719, -110.27409362792969, -107.74149322509766, -105.20889282226562, -102.67630004882812, -100.14370727539062, -97.6111068725586, -95.07850646972656, -92.54591369628906, -90.01332092285156, -87.48072052001953, -84.9481201171875, -82.41552734375, -79.8829345703125, -77.35033416748047, -74.81773376464844, -72.28514099121094, -69.75254821777344, -67.2199478149414, -64.68734741210938, -62.15475082397461, -59.622154235839844, -57.08955764770508, -54.55696105957031, -52.02436447143555, -49.49176788330078, -46.959171295166016, -44.42657470703125, -41.893978118896484, -39.36138153076172, -36.82878494262695, -34.29618835449219, -31.763591766357422, -29.230995178222656, -26.69839859008789, -24.165802001953125, -21.63320541381836, -19.100608825683594, -16.568012237548828, -14.035415649414062, -11.502819061279297, -8.970222473144531, -6.437625885009766, -3.905029296875, -1.3724327087402344, 1.1601638793945312, 3.692760467529297, 6.2253570556640625, 8.757953643798828, 11.290550231933594, 13.82314682006836, 16.355743408203125, 18.88833999633789]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 2.0, 7.0, 8.0, 12.0, 11.0, 19.0, 18.0, 19.0, 21.0, 27.0, 31.0, 28.0, 35.0, 28.0, 36.0, 33.0, 41.0, 37.0, 39.0, 48.0, 48.0, 48.0, 51.0, 42.0, 33.0, 36.0, 40.0, 25.0, 27.0, 27.0, 16.0, 12.0, 21.0, 18.0, 8.0, 14.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-30.263473510742188, -29.354202270507812, -28.444929122924805, -27.53565788269043, -26.626384735107422, -25.717113494873047, -24.807842254638672, -23.898571014404297, -22.98929786682129, -22.080026626586914, -21.170753479003906, -20.26148223876953, -19.352210998535156, -18.44293785095215, -17.533666610717773, -16.624393463134766, -15.71512222290039, -14.8058500289917, -13.896577835083008, -12.987306594848633, -12.078034400939941, -11.16876220703125, -10.259490966796875, -9.350218772888184, -8.440946578979492, -7.531674385070801, -6.622402667999268, -5.713130950927734, -4.803858757019043, -3.8945865631103516, -2.9853148460388184, -2.076043128967285, -1.166769027709961, -0.25749707221984863, 0.6517748832702637, 1.561046838760376, 2.4703187942504883, 3.3795909881591797, 4.288862705230713, 5.198134422302246, 6.1074066162109375, 7.016678810119629, 7.925950527191162, 8.835222244262695, 9.744494438171387, 10.653766632080078, 11.563037872314453, 12.472310066223145, 13.381582260131836, 14.290854454040527, 15.200126647949219, 16.109397888183594, 17.01866912841797, 17.927942276000977, 18.83721351623535, 19.74648666381836, 20.655757904052734, 21.56502914428711, 22.474302291870117, 23.383573532104492, 24.2928466796875, 25.202117919921875, 26.11138916015625, 27.020660400390625, 27.929933547973633]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 13.0, 13.0, 13.0, 20.0, 25.0, 17.0, 20.0, 31.0, 28.0, 26.0, 36.0, 32.0, 43.0, 35.0, 37.0, 34.0, 42.0, 45.0, 29.0, 39.0, 24.0, 46.0, 40.0, 38.0, 28.0, 41.0, 29.0, 31.0, 21.0, 18.0, 17.0, 12.0, 20.0, 7.0, 4.0, 6.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.373046875, -3.27398681640625, -3.1749267578125, -3.07586669921875, -2.976806640625, -2.87774658203125, -2.7786865234375, -2.67962646484375, -2.58056640625, -2.48150634765625, -2.3824462890625, -2.28338623046875, -2.184326171875, -2.08526611328125, -1.9862060546875, -1.88714599609375, -1.7880859375, -1.68902587890625, -1.5899658203125, -1.49090576171875, -1.391845703125, -1.29278564453125, -1.1937255859375, -1.09466552734375, -0.99560546875, -0.89654541015625, -0.7974853515625, -0.69842529296875, -0.599365234375, -0.50030517578125, -0.4012451171875, -0.30218505859375, -0.203125, -0.10406494140625, -0.0050048828125, 0.09405517578125, 0.193115234375, 0.29217529296875, 0.3912353515625, 0.49029541015625, 0.58935546875, 0.68841552734375, 0.7874755859375, 0.88653564453125, 0.985595703125, 1.08465576171875, 1.1837158203125, 1.28277587890625, 1.3818359375, 1.48089599609375, 1.5799560546875, 1.67901611328125, 1.778076171875, 1.87713623046875, 1.9761962890625, 2.07525634765625, 2.17431640625, 2.27337646484375, 2.3724365234375, 2.47149658203125, 2.570556640625, 2.66961669921875, 2.7686767578125, 2.86773681640625, 2.966796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 5.0, 13.0, 11.0, 26.0, 17.0, 34.0, 37.0, 31.0, 60.0, 84.0, 130.0, 227.0, 407.0, 961.0, 2310.0, 7732.0, 36116.0, 321894.0, 2139542.0, 1480306.0, 172600.0, 22670.0, 5502.0, 1816.0, 723.0, 380.0, 201.0, 113.0, 78.0, 57.0, 39.0, 30.0, 22.0, 23.0, 19.0, 13.0, 10.0, 7.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.5, -7.2908935546875, -7.081787109375, -6.8726806640625, -6.66357421875, -6.4544677734375, -6.245361328125, -6.0362548828125, -5.8271484375, -5.6180419921875, -5.408935546875, -5.1998291015625, -4.99072265625, -4.7816162109375, -4.572509765625, -4.3634033203125, -4.154296875, -3.9451904296875, -3.736083984375, -3.5269775390625, -3.31787109375, -3.1087646484375, -2.899658203125, -2.6905517578125, -2.4814453125, -2.2723388671875, -2.063232421875, -1.8541259765625, -1.64501953125, -1.4359130859375, -1.226806640625, -1.0177001953125, -0.80859375, -0.5994873046875, -0.390380859375, -0.1812744140625, 0.02783203125, 0.2369384765625, 0.446044921875, 0.6551513671875, 0.8642578125, 1.0733642578125, 1.282470703125, 1.4915771484375, 1.70068359375, 1.9097900390625, 2.118896484375, 2.3280029296875, 2.537109375, 2.7462158203125, 2.955322265625, 3.1644287109375, 3.37353515625, 3.5826416015625, 3.791748046875, 4.0008544921875, 4.2099609375, 4.4190673828125, 4.628173828125, 4.8372802734375, 5.04638671875, 5.2554931640625, 5.464599609375, 5.6737060546875, 5.8828125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 29.0, 72.0, 248.0, 897.0, 1815.0, 740.0, 199.0, 55.0, 16.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.171875, -25.4130859375, -24.654296875, -23.8955078125, -23.13671875, -22.3779296875, -21.619140625, -20.8603515625, -20.1015625, -19.3427734375, -18.583984375, -17.8251953125, -17.06640625, -16.3076171875, -15.548828125, -14.7900390625, -14.03125, -13.2724609375, -12.513671875, -11.7548828125, -10.99609375, -10.2373046875, -9.478515625, -8.7197265625, -7.9609375, -7.2021484375, -6.443359375, -5.6845703125, -4.92578125, -4.1669921875, -3.408203125, -2.6494140625, -1.890625, -1.1318359375, -0.373046875, 0.3857421875, 1.14453125, 1.9033203125, 2.662109375, 3.4208984375, 4.1796875, 4.9384765625, 5.697265625, 6.4560546875, 7.21484375, 7.9736328125, 8.732421875, 9.4912109375, 10.25, 11.0087890625, 11.767578125, 12.5263671875, 13.28515625, 14.0439453125, 14.802734375, 15.5615234375, 16.3203125, 17.0791015625, 17.837890625, 18.5966796875, 19.35546875, 20.1142578125, 20.873046875, 21.6318359375, 22.390625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 7.0, 11.0, 29.0, 52.0, 249.0, 1423.0, 499517.0, 3690395.0, 2057.0, 400.0, 93.0, 25.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -47.82373046875, -46.1787109375, -44.53369140625, -42.888671875, -41.24365234375, -39.5986328125, -37.95361328125, -36.30859375, -34.66357421875, -33.0185546875, -31.37353515625, -29.728515625, -28.08349609375, -26.4384765625, -24.79345703125, -23.1484375, -21.50341796875, -19.8583984375, -18.21337890625, -16.568359375, -14.92333984375, -13.2783203125, -11.63330078125, -9.98828125, -8.34326171875, -6.6982421875, -5.05322265625, -3.408203125, -1.76318359375, -0.1181640625, 1.52685546875, 3.171875, 4.81689453125, 6.4619140625, 8.10693359375, 9.751953125, 11.39697265625, 13.0419921875, 14.68701171875, 16.33203125, 17.97705078125, 19.6220703125, 21.26708984375, 22.912109375, 24.55712890625, 26.2021484375, 27.84716796875, 29.4921875, 31.13720703125, 32.7822265625, 34.42724609375, 36.072265625, 37.71728515625, 39.3623046875, 41.00732421875, 42.65234375, 44.29736328125, 45.9423828125, 47.58740234375, 49.232421875, 50.87744140625, 52.5224609375, 54.16748046875, 55.8125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 31.0, 164.0, 473.0, 279.0, 51.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.59152221679688, -101.88837432861328, -99.18522644042969, -96.4820785522461, -93.7789306640625, -91.0757827758789, -88.37263488769531, -85.66949462890625, -82.96633911132812, -80.26319122314453, -77.56004333496094, -74.85689544677734, -72.15374755859375, -69.45059967041016, -66.74745178222656, -64.0443115234375, -61.341163635253906, -58.63801574707031, -55.93486785888672, -53.231719970703125, -50.52857208251953, -47.82542419433594, -45.12228012084961, -42.419132232666016, -39.71598434448242, -37.01283645629883, -34.309688568115234, -31.606542587280273, -28.90339469909668, -26.200246810913086, -23.497100830078125, -20.79395294189453, -18.090805053710938, -15.387657165527344, -12.684510231018066, -9.981363296508789, -7.278215408325195, -4.575067520141602, -1.8719215393066406, 0.8312263488769531, 3.534374237060547, 6.237521648406982, 8.940669059753418, 11.643815994262695, 14.346963882446289, 17.050111770629883, 19.753257751464844, 22.456405639648438, 25.15955352783203, 27.862701416015625, 30.56584930419922, 33.26899719238281, 35.972145080566406, 38.67529296875, 41.37843704223633, 44.08158493041992, 46.784732818603516, 49.48788070678711, 52.1910285949707, 54.89417266845703, 57.597320556640625, 60.30046844482422, 63.00361633300781, 65.7067642211914, 68.409912109375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 17.0, 10.0, 8.0, 10.0, 14.0, 17.0, 22.0, 14.0, 27.0, 19.0, 29.0, 29.0, 43.0, 37.0, 32.0, 47.0, 40.0, 45.0, 27.0, 49.0, 25.0, 33.0, 38.0, 33.0, 42.0, 28.0, 29.0, 32.0, 22.0, 24.0, 25.0, 25.0, 21.0, 19.0, 11.0, 14.0, 6.0, 7.0, 2.0, 4.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.871299743652344, -25.081384658813477, -24.291467666625977, -23.50155258178711, -22.711637496948242, -21.921722412109375, -21.131805419921875, -20.341890335083008, -19.55197525024414, -18.762060165405273, -17.972143173217773, -17.182228088378906, -16.39231300354004, -15.602396965026855, -14.812480926513672, -14.022565841674805, -13.232648849487305, -12.442732810974121, -11.652817726135254, -10.86290168762207, -10.072986602783203, -9.28307056427002, -8.493154525756836, -7.7032389640808105, -6.913323402404785, -6.12340784072876, -5.333492279052734, -4.543576240539551, -3.7536606788635254, -2.9637451171875, -2.1738290786743164, -1.383913516998291, -0.5939960479736328, 0.19591963291168213, 0.9858353137969971, 1.7757511138916016, 2.565666675567627, 3.3555822372436523, 4.145498275756836, 4.935413837432861, 5.725329399108887, 6.515244960784912, 7.3051605224609375, 8.095076560974121, 8.884992599487305, 9.674907684326172, 10.464823722839355, 11.254739761352539, 12.044654846191406, 12.83457088470459, 13.624485969543457, 14.41440200805664, 15.204317092895508, 15.994233131408691, 16.784149169921875, 17.574064254760742, 18.36397933959961, 19.153894424438477, 19.943811416625977, 20.733726501464844, 21.52364158630371, 22.313556671142578, 23.103473663330078, 23.893388748168945, 24.683305740356445]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 7.0, 10.0, 11.0, 15.0, 18.0, 21.0, 17.0, 15.0, 20.0, 23.0, 21.0, 26.0, 26.0, 38.0, 30.0, 23.0, 40.0, 30.0, 31.0, 36.0, 45.0, 39.0, 38.0, 41.0, 42.0, 27.0, 40.0, 33.0, 28.0, 29.0, 24.0, 21.0, 18.0, 14.0, 23.0, 10.0, 10.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8910675048828125, -1.820220947265625, -1.7493743896484375, -1.67852783203125, -1.6076812744140625, -1.536834716796875, -1.4659881591796875, -1.3951416015625, -1.3242950439453125, -1.253448486328125, -1.1826019287109375, -1.11175537109375, -1.0409088134765625, -0.970062255859375, -0.8992156982421875, -0.828369140625, -0.7575225830078125, -0.686676025390625, -0.6158294677734375, -0.54498291015625, -0.4741363525390625, -0.403289794921875, -0.3324432373046875, -0.2615966796875, -0.1907501220703125, -0.119903564453125, -0.0490570068359375, 0.02178955078125, 0.0926361083984375, 0.163482666015625, 0.2343292236328125, 0.30517578125, 0.3760223388671875, 0.446868896484375, 0.5177154541015625, 0.58856201171875, 0.6594085693359375, 0.730255126953125, 0.8011016845703125, 0.8719482421875, 0.9427947998046875, 1.013641357421875, 1.0844879150390625, 1.15533447265625, 1.2261810302734375, 1.297027587890625, 1.3678741455078125, 1.438720703125, 1.5095672607421875, 1.580413818359375, 1.6512603759765625, 1.72210693359375, 1.7929534912109375, 1.863800048828125, 1.9346466064453125, 2.0054931640625, 2.0763397216796875, 2.147186279296875, 2.2180328369140625, 2.28887939453125, 2.3597259521484375, 2.430572509765625, 2.5014190673828125, 2.572265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 5.0, 8.0, 15.0, 18.0, 21.0, 33.0, 42.0, 58.0, 104.0, 181.0, 254.0, 387.0, 573.0, 906.0, 1395.0, 2247.0, 3391.0, 5445.0, 8370.0, 13051.0, 20726.0, 33074.0, 56067.0, 100223.0, 200746.0, 279901.0, 136057.0, 72586.0, 42062.0, 25483.0, 16397.0, 10226.0, 6570.0, 4330.0, 2733.0, 1741.0, 1100.0, 726.0, 462.0, 288.0, 195.0, 114.0, 80.0, 50.0, 42.0, 31.0, 20.0, 7.0, 6.0, 6.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.401611328125, -0.3873863220214844, -0.37316131591796875, -0.3589363098144531, -0.3447113037109375, -0.3304862976074219, -0.31626129150390625, -0.3020362854003906, -0.287811279296875, -0.2735862731933594, -0.25936126708984375, -0.24513626098632812, -0.2309112548828125, -0.21668624877929688, -0.20246124267578125, -0.18823623657226562, -0.17401123046875, -0.15978622436523438, -0.14556121826171875, -0.13133621215820312, -0.1171112060546875, -0.10288619995117188, -0.08866119384765625, -0.07443618774414062, -0.060211181640625, -0.045986175537109375, -0.03176116943359375, -0.017536163330078125, -0.0033111572265625, 0.010913848876953125, 0.02513885498046875, 0.039363861083984375, 0.0535888671875, 0.06781387329101562, 0.08203887939453125, 0.09626388549804688, 0.1104888916015625, 0.12471389770507812, 0.13893890380859375, 0.15316390991210938, 0.167388916015625, 0.18161392211914062, 0.19583892822265625, 0.21006393432617188, 0.2242889404296875, 0.23851394653320312, 0.25273895263671875, 0.2669639587402344, 0.28118896484375, 0.2954139709472656, 0.30963897705078125, 0.3238639831542969, 0.3380889892578125, 0.3523139953613281, 0.36653900146484375, 0.3807640075683594, 0.394989013671875, 0.4092140197753906, 0.42343902587890625, 0.4376640319824219, 0.4518890380859375, 0.4661140441894531, 0.48033905029296875, 0.4945640563964844, 0.5087890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 2.0, 3.0, 9.0, 7.0, 10.0, 12.0, 15.0, 21.0, 12.0, 13.0, 31.0, 19.0, 22.0, 30.0, 29.0, 41.0, 38.0, 41.0, 48.0, 38.0, 35.0, 1066.0, 40.0, 33.0, 36.0, 47.0, 37.0, 34.0, 32.0, 30.0, 47.0, 13.0, 27.0, 21.0, 20.0, 14.0, 17.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.65826416015625, -1.6065673828125, -1.55487060546875, -1.503173828125, -1.45147705078125, -1.3997802734375, -1.34808349609375, -1.29638671875, -1.24468994140625, -1.1929931640625, -1.14129638671875, -1.089599609375, -1.03790283203125, -0.9862060546875, -0.93450927734375, -0.8828125, -0.83111572265625, -0.7794189453125, -0.72772216796875, -0.676025390625, -0.62432861328125, -0.5726318359375, -0.52093505859375, -0.46923828125, -0.41754150390625, -0.3658447265625, -0.31414794921875, -0.262451171875, -0.21075439453125, -0.1590576171875, -0.10736083984375, -0.0556640625, -0.00396728515625, 0.0477294921875, 0.09942626953125, 0.151123046875, 0.20281982421875, 0.2545166015625, 0.30621337890625, 0.35791015625, 0.40960693359375, 0.4613037109375, 0.51300048828125, 0.564697265625, 0.61639404296875, 0.6680908203125, 0.71978759765625, 0.771484375, 0.82318115234375, 0.8748779296875, 0.92657470703125, 0.978271484375, 1.02996826171875, 1.0816650390625, 1.13336181640625, 1.18505859375, 1.23675537109375, 1.2884521484375, 1.34014892578125, 1.391845703125, 1.44354248046875, 1.4952392578125, 1.54693603515625, 1.5986328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 13.0, 14.0, 17.0, 27.0, 50.0, 74.0, 102.0, 170.0, 233.0, 377.0, 555.0, 820.0, 1297.0, 1940.0, 2870.0, 4491.0, 6925.0, 10835.0, 17182.0, 27605.0, 45995.0, 79319.0, 152250.0, 1350179.0, 174465.0, 87663.0, 49990.0, 29728.0, 18411.0, 11704.0, 7560.0, 4975.0, 3144.0, 2189.0, 1325.0, 908.0, 598.0, 387.0, 243.0, 177.0, 108.0, 91.0, 41.0, 27.0, 25.0, 14.0, 10.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453857421875, -0.4399299621582031, -0.42600250244140625, -0.4120750427246094, -0.3981475830078125, -0.3842201232910156, -0.37029266357421875, -0.3563652038574219, -0.342437744140625, -0.3285102844238281, -0.31458282470703125, -0.3006553649902344, -0.2867279052734375, -0.2728004455566406, -0.25887298583984375, -0.24494552612304688, -0.23101806640625, -0.21709060668945312, -0.20316314697265625, -0.18923568725585938, -0.1753082275390625, -0.16138076782226562, -0.14745330810546875, -0.13352584838867188, -0.119598388671875, -0.10567092895507812, -0.09174346923828125, -0.07781600952148438, -0.0638885498046875, -0.049961090087890625, -0.03603363037109375, -0.022106170654296875, -0.0081787109375, 0.005748748779296875, 0.01967620849609375, 0.033603668212890625, 0.0475311279296875, 0.061458587646484375, 0.07538604736328125, 0.08931350708007812, 0.103240966796875, 0.11716842651367188, 0.13109588623046875, 0.14502334594726562, 0.1589508056640625, 0.17287826538085938, 0.18680572509765625, 0.20073318481445312, 0.21466064453125, 0.22858810424804688, 0.24251556396484375, 0.2564430236816406, 0.2703704833984375, 0.2842979431152344, 0.29822540283203125, 0.3121528625488281, 0.326080322265625, 0.3400077819824219, 0.35393524169921875, 0.3678627014160156, 0.3817901611328125, 0.3957176208496094, 0.40964508056640625, 0.4235725402832031, 0.4375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 4.0, 12.0, 12.0, 14.0, 12.0, 15.0, 19.0, 24.0, 25.0, 34.0, 38.0, 48.0, 46.0, 52.0, 47.0, 62.0, 59.0, 50.0, 52.0, 48.0, 54.0, 37.0, 32.0, 33.0, 28.0, 20.0, 19.0, 23.0, 13.0, 15.0, 5.0, 7.0, 2.0, 2.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00034356117248535156, -0.00033297762274742126, -0.00032239407300949097, -0.00031181052327156067, -0.00030122697353363037, -0.0002906434237957001, -0.0002800598740577698, -0.0002694763243198395, -0.0002588927745819092, -0.0002483092248439789, -0.00023772567510604858, -0.00022714212536811829, -0.000216558575630188, -0.0002059750258922577, -0.0001953914761543274, -0.0001848079264163971, -0.0001742243766784668, -0.0001636408269405365, -0.0001530572772026062, -0.0001424737274646759, -0.0001318901777267456, -0.00012130662798881531, -0.00011072307825088501, -0.00010013952851295471, -8.955597877502441e-05, -7.897242903709412e-05, -6.838887929916382e-05, -5.780532956123352e-05, -4.722177982330322e-05, -3.6638230085372925e-05, -2.6054680347442627e-05, -1.547113060951233e-05, -4.887580871582031e-06, 5.695968866348267e-06, 1.6279518604278564e-05, 2.6863068342208862e-05, 3.744661808013916e-05, 4.803016781806946e-05, 5.8613717555999756e-05, 6.919726729393005e-05, 7.978081703186035e-05, 9.036436676979065e-05, 0.00010094791650772095, 0.00011153146624565125, 0.00012211501598358154, 0.00013269856572151184, 0.00014328211545944214, 0.00015386566519737244, 0.00016444921493530273, 0.00017503276467323303, 0.00018561631441116333, 0.00019619986414909363, 0.00020678341388702393, 0.00021736696362495422, 0.00022795051336288452, 0.00023853406310081482, 0.0002491176128387451, 0.0002597011625766754, 0.0002702847123146057, 0.000280868262052536, 0.0002914518117904663, 0.0003020353615283966, 0.0003126189112663269, 0.0003232024610042572, 0.0003337860107421875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 10.0, 6.0, 6.0, 12.0, 10.0, 17.0, 30.0, 37.0, 62.0, 76.0, 113.0, 159.0, 254.0, 409.0, 831.0, 2641.0, 1037891.0, 3751.0, 911.0, 461.0, 262.0, 174.0, 119.0, 89.0, 45.0, 50.0, 39.0, 23.0, 15.0, 15.0, 11.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00811767578125, -0.007868289947509766, -0.007618904113769531, -0.007369518280029297, -0.0071201324462890625, -0.006870746612548828, -0.006621360778808594, -0.006371974945068359, -0.006122589111328125, -0.005873203277587891, -0.005623817443847656, -0.005374431610107422, -0.0051250457763671875, -0.004875659942626953, -0.004626274108886719, -0.004376888275146484, -0.00412750244140625, -0.0038781166076660156, -0.0036287307739257812, -0.003379344940185547, -0.0031299591064453125, -0.002880573272705078, -0.0026311874389648438, -0.0023818016052246094, -0.002132415771484375, -0.0018830299377441406, -0.0016336441040039062, -0.0013842582702636719, -0.0011348724365234375, -0.0008854866027832031, -0.0006361007690429688, -0.0003867149353027344, -0.0001373291015625, 0.00011205673217773438, 0.00036144256591796875, 0.0006108283996582031, 0.0008602142333984375, 0.0011096000671386719, 0.0013589859008789062, 0.0016083717346191406, 0.001857757568359375, 0.0021071434020996094, 0.0023565292358398438, 0.002605915069580078, 0.0028553009033203125, 0.003104686737060547, 0.0033540725708007812, 0.0036034584045410156, 0.00385284423828125, 0.004102230072021484, 0.004351615905761719, 0.004601001739501953, 0.0048503875732421875, 0.005099773406982422, 0.005349159240722656, 0.005598545074462891, 0.005847930908203125, 0.006097316741943359, 0.006346702575683594, 0.006596088409423828, 0.0068454742431640625, 0.007094860076904297, 0.007344245910644531, 0.007593631744384766, 0.007843017578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 65.0, 553.0, 364.0, 27.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001295246183872223, -0.0012669855495914817, -0.0012387249153107405, -0.0012104642810299993, -0.001182203646749258, -0.0011539431288838387, -0.0011256824946030974, -0.0010974218603223562, -0.001069161226041615, -0.0010409005917608738, -0.0010126399574801326, -0.0009843793231993914, -0.0009561187471263111, -0.0009278581128455698, -0.0008995975367724895, -0.0008713369024917483, -0.0008430762682110071, -0.0008148156339302659, -0.0007865549996495247, -0.0007582944235764444, -0.0007300337892957032, -0.000701773155014962, -0.0006735125789418817, -0.0006452519446611404, -0.0006169913103803992, -0.000588730676099658, -0.0005604700418189168, -0.0005322094657458365, -0.0005039488314650953, -0.00047568819718435407, -0.0004474275920074433, -0.00041916698683053255, -0.0003909062943421304, -0.0003626456600613892, -0.00033438505488447845, -0.0003061244497075677, -0.0002778638154268265, -0.00024960318114608526, -0.0002213425759691745, -0.00019308195624034852, -0.00016482133651152253, -0.00013656071678269655, -0.00010830009705387056, -8.003947732504457e-05, -5.1778857596218586e-05, -2.35182378673926e-05, 4.742381861433387e-06, 3.300300159025937e-05, 6.126362131908536e-05, 8.952424104791135e-05, 0.00011778486077673733, 0.00014604548050556332, 0.0001743061002343893, 0.0002025667199632153, 0.00023082733969204128, 0.00025908794486895204, 0.00028734857914969325, 0.00031560921343043447, 0.0003438698186073452, 0.000372130423784256, 0.0004003910580649972, 0.0004286516923457384, 0.00045691229752264917, 0.0004851729026995599, 0.0005134335369803011]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 12.0, 11.0, 16.0, 12.0, 9.0, 13.0, 25.0, 22.0, 18.0, 26.0, 24.0, 27.0, 44.0, 43.0, 44.0, 40.0, 37.0, 37.0, 46.0, 37.0, 43.0, 52.0, 39.0, 43.0, 25.0, 33.0, 31.0, 25.0, 13.0, 20.0, 23.0, 16.0, 15.0, 12.0, 11.0, 15.0, 10.0, 6.0, 2.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00020182132720947266, -0.00019604898989200592, -0.00019027665257453918, -0.00018450431525707245, -0.0001787319779396057, -0.00017295964062213898, -0.00016718730330467224, -0.0001614149659872055, -0.00015564262866973877, -0.00014987029135227203, -0.0001440979540348053, -0.00013832561671733856, -0.00013255327939987183, -0.0001267809420824051, -0.00012100860476493835, -0.00011523626744747162, -0.00010946393013000488, -0.00010369159281253815, -9.791925549507141e-05, -9.214691817760468e-05, -8.637458086013794e-05, -8.06022435426712e-05, -7.482990622520447e-05, -6.905756890773773e-05, -6.3285231590271e-05, -5.751289427280426e-05, -5.1740556955337524e-05, -4.596821963787079e-05, -4.019588232040405e-05, -3.442354500293732e-05, -2.865120768547058e-05, -2.2878870368003845e-05, -1.710653305053711e-05, -1.1334195733070374e-05, -5.561858415603638e-06, 2.1047890186309814e-07, 5.982816219329834e-06, 1.175515353679657e-05, 1.7527490854263306e-05, 2.329982817173004e-05, 2.9072165489196777e-05, 3.484450280666351e-05, 4.061684012413025e-05, 4.6389177441596985e-05, 5.216151475906372e-05, 5.7933852076530457e-05, 6.370618939399719e-05, 6.947852671146393e-05, 7.525086402893066e-05, 8.10232013463974e-05, 8.679553866386414e-05, 9.256787598133087e-05, 9.834021329879761e-05, 0.00010411255061626434, 0.00010988488793373108, 0.00011565722525119781, 0.00012142956256866455, 0.0001272018998861313, 0.00013297423720359802, 0.00013874657452106476, 0.0001445189118385315, 0.00015029124915599823, 0.00015606358647346497, 0.0001618359237909317, 0.00016760826110839844]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 7.0, 10.0, 11.0, 15.0, 18.0, 21.0, 17.0, 15.0, 20.0, 23.0, 21.0, 26.0, 26.0, 38.0, 30.0, 23.0, 40.0, 30.0, 31.0, 36.0, 45.0, 39.0, 38.0, 41.0, 42.0, 27.0, 40.0, 33.0, 28.0, 29.0, 23.0, 22.0, 18.0, 14.0, 23.0, 10.0, 10.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8910675048828125, -1.820220947265625, -1.7493743896484375, -1.67852783203125, -1.6076812744140625, -1.536834716796875, -1.4659881591796875, -1.3951416015625, -1.3242950439453125, -1.253448486328125, -1.1826019287109375, -1.11175537109375, -1.0409088134765625, -0.970062255859375, -0.8992156982421875, -0.828369140625, -0.7575225830078125, -0.686676025390625, -0.6158294677734375, -0.54498291015625, -0.4741363525390625, -0.403289794921875, -0.3324432373046875, -0.2615966796875, -0.1907501220703125, -0.119903564453125, -0.0490570068359375, 0.02178955078125, 0.0926361083984375, 0.163482666015625, 0.2343292236328125, 0.30517578125, 0.3760223388671875, 0.446868896484375, 0.5177154541015625, 0.58856201171875, 0.6594085693359375, 0.730255126953125, 0.8011016845703125, 0.8719482421875, 0.9427947998046875, 1.013641357421875, 1.0844879150390625, 1.15533447265625, 1.2261810302734375, 1.297027587890625, 1.3678741455078125, 1.438720703125, 1.5095672607421875, 1.580413818359375, 1.6512603759765625, 1.72210693359375, 1.7929534912109375, 1.863800048828125, 1.9346466064453125, 2.0054931640625, 2.0763397216796875, 2.147186279296875, 2.2180328369140625, 2.28887939453125, 2.3597259521484375, 2.430572509765625, 2.5014190673828125, 2.572265625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 15.0, 27.0, 26.0, 44.0, 44.0, 80.0, 91.0, 127.0, 158.0, 229.0, 329.0, 483.0, 742.0, 1207.0, 2095.0, 4212.0, 10528.0, 39074.0, 257153.0, 594055.0, 103101.0, 20357.0, 6787.0, 3014.0, 1612.0, 933.0, 553.0, 402.0, 271.0, 198.0, 149.0, 130.0, 84.0, 61.0, 46.0, 36.0, 20.0, 17.0, 12.0, 6.0, 5.0, 2.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.2557373046875, -4.105224609375, -3.9547119140625, -3.80419921875, -3.6536865234375, -3.503173828125, -3.3526611328125, -3.2021484375, -3.0516357421875, -2.901123046875, -2.7506103515625, -2.60009765625, -2.4495849609375, -2.299072265625, -2.1485595703125, -1.998046875, -1.8475341796875, -1.697021484375, -1.5465087890625, -1.39599609375, -1.2454833984375, -1.094970703125, -0.9444580078125, -0.7939453125, -0.6434326171875, -0.492919921875, -0.3424072265625, -0.19189453125, -0.0413818359375, 0.109130859375, 0.2596435546875, 0.41015625, 0.5606689453125, 0.711181640625, 0.8616943359375, 1.01220703125, 1.1627197265625, 1.313232421875, 1.4637451171875, 1.6142578125, 1.7647705078125, 1.915283203125, 2.0657958984375, 2.21630859375, 2.3668212890625, 2.517333984375, 2.6678466796875, 2.818359375, 2.9688720703125, 3.119384765625, 3.2698974609375, 3.42041015625, 3.5709228515625, 3.721435546875, 3.8719482421875, 4.0224609375, 4.1729736328125, 4.323486328125, 4.4739990234375, 4.62451171875, 4.7750244140625, 4.925537109375, 5.0760498046875, 5.2265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 9.0, 5.0, 13.0, 7.0, 13.0, 16.0, 18.0, 19.0, 33.0, 31.0, 36.0, 57.0, 42.0, 85.0, 158.0, 435.0, 1483.0, 155.0, 83.0, 63.0, 42.0, 44.0, 40.0, 31.0, 24.0, 22.0, 18.0, 12.0, 10.0, 8.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.1064453125, -8.822265625, -8.5380859375, -8.25390625, -7.9697265625, -7.685546875, -7.4013671875, -7.1171875, -6.8330078125, -6.548828125, -6.2646484375, -5.98046875, -5.6962890625, -5.412109375, -5.1279296875, -4.84375, -4.5595703125, -4.275390625, -3.9912109375, -3.70703125, -3.4228515625, -3.138671875, -2.8544921875, -2.5703125, -2.2861328125, -2.001953125, -1.7177734375, -1.43359375, -1.1494140625, -0.865234375, -0.5810546875, -0.296875, -0.0126953125, 0.271484375, 0.5556640625, 0.83984375, 1.1240234375, 1.408203125, 1.6923828125, 1.9765625, 2.2607421875, 2.544921875, 2.8291015625, 3.11328125, 3.3974609375, 3.681640625, 3.9658203125, 4.25, 4.5341796875, 4.818359375, 5.1025390625, 5.38671875, 5.6708984375, 5.955078125, 6.2392578125, 6.5234375, 6.8076171875, 7.091796875, 7.3759765625, 7.66015625, 7.9443359375, 8.228515625, 8.5126953125, 8.796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 5.0, 7.0, 14.0, 19.0, 23.0, 36.0, 36.0, 72.0, 82.0, 102.0, 169.0, 320.0, 570.0, 1422.0, 24516.0, 3110201.0, 5751.0, 1042.0, 414.0, 244.0, 175.0, 115.0, 91.0, 65.0, 48.0, 47.0, 27.0, 14.0, 13.0, 15.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.5625, -18.957763671875, -18.35302734375, -17.748291015625, -17.1435546875, -16.538818359375, -15.93408203125, -15.329345703125, -14.724609375, -14.119873046875, -13.51513671875, -12.910400390625, -12.3056640625, -11.700927734375, -11.09619140625, -10.491455078125, -9.88671875, -9.281982421875, -8.67724609375, -8.072509765625, -7.4677734375, -6.863037109375, -6.25830078125, -5.653564453125, -5.048828125, -4.444091796875, -3.83935546875, -3.234619140625, -2.6298828125, -2.025146484375, -1.42041015625, -0.815673828125, -0.2109375, 0.393798828125, 0.99853515625, 1.603271484375, 2.2080078125, 2.812744140625, 3.41748046875, 4.022216796875, 4.626953125, 5.231689453125, 5.83642578125, 6.441162109375, 7.0458984375, 7.650634765625, 8.25537109375, 8.860107421875, 9.46484375, 10.069580078125, 10.67431640625, 11.279052734375, 11.8837890625, 12.488525390625, 13.09326171875, 13.697998046875, 14.302734375, 14.907470703125, 15.51220703125, 16.116943359375, 16.7216796875, 17.326416015625, 17.93115234375, 18.535888671875, 19.140625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 47.0, 967.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.534912109375, -308.74957275390625, -302.9642333984375, -297.17889404296875, -291.3935546875, -285.60821533203125, -279.8228759765625, -274.0375671386719, -268.2522277832031, -262.4668884277344, -256.6815490722656, -250.89620971679688, -245.1108856201172, -239.32554626464844, -233.5402069091797, -227.75486755371094, -221.9695281982422, -216.18418884277344, -210.3988494873047, -204.613525390625, -198.82818603515625, -193.0428466796875, -187.25750732421875, -181.47216796875, -175.68682861328125, -169.9014892578125, -164.11614990234375, -158.330810546875, -152.5454864501953, -146.76014709472656, -140.9748077392578, -135.18946838378906, -129.40415954589844, -123.61882019042969, -117.83348846435547, -112.04814910888672, -106.2628173828125, -100.47747802734375, -94.692138671875, -88.90679931640625, -83.1214599609375, -77.33612060546875, -71.55078887939453, -65.76544952392578, -59.9801139831543, -54.19477844238281, -48.40943908691406, -42.62410354614258, -36.83877182006836, -31.053436279296875, -25.268098831176758, -19.48276138305664, -13.697425842285156, -7.912090301513672, -2.126750946044922, 3.6585845947265625, 9.443920135498047, 15.229256629943848, 21.01459312438965, 26.799930572509766, 32.58526611328125, 38.370601654052734, 44.155941009521484, 49.94127655029297, 55.72661209106445]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 4.0, 9.0, 4.0, 7.0, 7.0, 7.0, 7.0, 16.0, 13.0, 16.0, 18.0, 15.0, 21.0, 19.0, 30.0, 23.0, 26.0, 24.0, 32.0, 27.0, 42.0, 27.0, 33.0, 34.0, 34.0, 45.0, 36.0, 33.0, 30.0, 28.0, 37.0, 27.0, 27.0, 20.0, 21.0, 26.0, 19.0, 22.0, 13.0, 20.0, 10.0, 15.0, 12.0, 12.0, 10.0, 7.0, 10.0, 10.0, 5.0, 1.0, 6.0, 3.0, 1.0], "bins": [-18.782054901123047, -18.286327362060547, -17.790599822998047, -17.294872283935547, -16.799144744873047, -16.303417205810547, -15.80768871307373, -15.31196117401123, -14.816232681274414, -14.320505142211914, -13.824777603149414, -13.329050064086914, -12.833321571350098, -12.337594032287598, -11.841866493225098, -11.346138954162598, -10.850411415100098, -10.354683876037598, -9.858956336975098, -9.363227844238281, -8.867500305175781, -8.371772766113281, -7.876045227050781, -7.380317687988281, -6.884589672088623, -6.388862133026123, -5.893134117126465, -5.397406578063965, -4.901679039001465, -4.405951023101807, -3.9102234840393066, -3.4144957065582275, -2.918768882751465, -2.4230411052703857, -1.9273134469985962, -1.4315857887268066, -0.9358580112457275, -0.44013023376464844, 0.05559730529785156, 0.5513250827789307, 1.0470528602600098, 1.5427806377410889, 2.038508415222168, 2.534235954284668, 3.029963731765747, 3.525691509246826, 4.021419048309326, 4.517147064208984, 5.012874603271484, 5.508602142333984, 6.004330158233643, 6.500057697296143, 6.995785713195801, 7.491513252258301, 7.987240791320801, 8.4829683303833, 8.978696823120117, 9.474424362182617, 9.970151901245117, 10.465879440307617, 10.961607933044434, 11.457335472106934, 11.953063011169434, 12.448790550231934, 12.944518089294434]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 13.0, 11.0, 11.0, 12.0, 13.0, 11.0, 18.0, 21.0, 19.0, 21.0, 19.0, 26.0, 27.0, 34.0, 32.0, 32.0, 40.0, 23.0, 39.0, 39.0, 38.0, 37.0, 33.0, 38.0, 37.0, 43.0, 38.0, 37.0, 27.0, 37.0, 21.0, 11.0, 18.0, 20.0, 15.0, 16.0, 14.0, 9.0, 9.0, 8.0, 5.0, 2.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.798828125, -2.714263916015625, -2.62969970703125, -2.545135498046875, -2.4605712890625, -2.376007080078125, -2.29144287109375, -2.206878662109375, -2.122314453125, -2.037750244140625, -1.95318603515625, -1.868621826171875, -1.7840576171875, -1.699493408203125, -1.61492919921875, -1.530364990234375, -1.44580078125, -1.361236572265625, -1.27667236328125, -1.192108154296875, -1.1075439453125, -1.022979736328125, -0.93841552734375, -0.853851318359375, -0.769287109375, -0.684722900390625, -0.60015869140625, -0.515594482421875, -0.4310302734375, -0.346466064453125, -0.26190185546875, -0.177337646484375, -0.0927734375, -0.008209228515625, 0.07635498046875, 0.160919189453125, 0.2454833984375, 0.330047607421875, 0.41461181640625, 0.499176025390625, 0.583740234375, 0.668304443359375, 0.75286865234375, 0.837432861328125, 0.9219970703125, 1.006561279296875, 1.09112548828125, 1.175689697265625, 1.26025390625, 1.344818115234375, 1.42938232421875, 1.513946533203125, 1.5985107421875, 1.683074951171875, 1.76763916015625, 1.852203369140625, 1.936767578125, 2.021331787109375, 2.10589599609375, 2.190460205078125, 2.2750244140625, 2.359588623046875, 2.44415283203125, 2.528717041015625, 2.61328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 4.0, 5.0, 4.0, 7.0, 16.0, 6.0, 13.0, 17.0, 19.0, 37.0, 30.0, 49.0, 49.0, 61.0, 77.0, 108.0, 147.0, 146.0, 250.0, 331.0, 467.0, 706.0, 1121.0, 2488.0, 14065.0, 985587.0, 3105949.0, 73612.0, 4378.0, 1508.0, 869.0, 576.0, 410.0, 275.0, 222.0, 161.0, 111.0, 95.0, 61.0, 44.0, 40.0, 32.0, 19.0, 27.0, 20.0, 23.0, 8.0, 7.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.8671875, -13.436767578125, -13.00634765625, -12.575927734375, -12.1455078125, -11.715087890625, -11.28466796875, -10.854248046875, -10.423828125, -9.993408203125, -9.56298828125, -9.132568359375, -8.7021484375, -8.271728515625, -7.84130859375, -7.410888671875, -6.98046875, -6.550048828125, -6.11962890625, -5.689208984375, -5.2587890625, -4.828369140625, -4.39794921875, -3.967529296875, -3.537109375, -3.106689453125, -2.67626953125, -2.245849609375, -1.8154296875, -1.385009765625, -0.95458984375, -0.524169921875, -0.09375, 0.336669921875, 0.76708984375, 1.197509765625, 1.6279296875, 2.058349609375, 2.48876953125, 2.919189453125, 3.349609375, 3.780029296875, 4.21044921875, 4.640869140625, 5.0712890625, 5.501708984375, 5.93212890625, 6.362548828125, 6.79296875, 7.223388671875, 7.65380859375, 8.084228515625, 8.5146484375, 8.945068359375, 9.37548828125, 9.805908203125, 10.236328125, 10.666748046875, 11.09716796875, 11.527587890625, 11.9580078125, 12.388427734375, 12.81884765625, 13.249267578125, 13.6796875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 8.0, 21.0, 12.0, 39.0, 67.0, 114.0, 219.0, 343.0, 519.0, 692.0, 683.0, 498.0, 351.0, 208.0, 119.0, 55.0, 42.0, 33.0, 14.0, 9.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.24932861328125, -6.0181884765625, -5.78704833984375, -5.555908203125, -5.32476806640625, -5.0936279296875, -4.86248779296875, -4.63134765625, -4.40020751953125, -4.1690673828125, -3.93792724609375, -3.706787109375, -3.47564697265625, -3.2445068359375, -3.01336669921875, -2.7822265625, -2.55108642578125, -2.3199462890625, -2.08880615234375, -1.857666015625, -1.62652587890625, -1.3953857421875, -1.16424560546875, -0.93310546875, -0.70196533203125, -0.4708251953125, -0.23968505859375, -0.008544921875, 0.22259521484375, 0.4537353515625, 0.68487548828125, 0.916015625, 1.14715576171875, 1.3782958984375, 1.60943603515625, 1.840576171875, 2.07171630859375, 2.3028564453125, 2.53399658203125, 2.76513671875, 2.99627685546875, 3.2274169921875, 3.45855712890625, 3.689697265625, 3.92083740234375, 4.1519775390625, 4.38311767578125, 4.6142578125, 4.84539794921875, 5.0765380859375, 5.30767822265625, 5.538818359375, 5.76995849609375, 6.0010986328125, 6.23223876953125, 6.46337890625, 6.69451904296875, 6.9256591796875, 7.15679931640625, 7.387939453125, 7.61907958984375, 7.8502197265625, 8.08135986328125, 8.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 33.0, 78.0, 159.0, 337.0, 888.0, 2663.0, 12596.0, 203240.0, 3330440.0, 612939.0, 24824.0, 3969.0, 1261.0, 453.0, 176.0, 90.0, 40.0, 23.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.46893310546875, -9.1956787109375, -8.92242431640625, -8.649169921875, -8.37591552734375, -8.1026611328125, -7.82940673828125, -7.55615234375, -7.28289794921875, -7.0096435546875, -6.73638916015625, -6.463134765625, -6.18988037109375, -5.9166259765625, -5.64337158203125, -5.3701171875, -5.09686279296875, -4.8236083984375, -4.55035400390625, -4.277099609375, -4.00384521484375, -3.7305908203125, -3.45733642578125, -3.18408203125, -2.91082763671875, -2.6375732421875, -2.36431884765625, -2.091064453125, -1.81781005859375, -1.5445556640625, -1.27130126953125, -0.998046875, -0.72479248046875, -0.4515380859375, -0.17828369140625, 0.094970703125, 0.36822509765625, 0.6414794921875, 0.91473388671875, 1.18798828125, 1.46124267578125, 1.7344970703125, 2.00775146484375, 2.281005859375, 2.55426025390625, 2.8275146484375, 3.10076904296875, 3.3740234375, 3.64727783203125, 3.9205322265625, 4.19378662109375, 4.467041015625, 4.74029541015625, 5.0135498046875, 5.28680419921875, 5.56005859375, 5.83331298828125, 6.1065673828125, 6.37982177734375, 6.653076171875, 6.92633056640625, 7.1995849609375, 7.47283935546875, 7.74609375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 4.0, 12.0, 17.0, 20.0, 32.0, 39.0, 47.0, 77.0, 93.0, 81.0, 100.0, 99.0, 84.0, 74.0, 61.0, 55.0, 30.0, 27.0, 20.0, 10.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.791250228881836, -22.712310791015625, -21.63336944580078, -20.55443000793457, -19.475488662719727, -18.396549224853516, -17.317607879638672, -16.23866844177246, -15.159728050231934, -14.080787658691406, -13.001847267150879, -11.922906875610352, -10.84396743774414, -9.765026092529297, -8.686086654663086, -7.607146263122559, -6.528205871582031, -5.449265480041504, -4.370325088500977, -3.2913851737976074, -2.21244478225708, -1.1335043907165527, -0.054564476013183594, 1.0243759155273438, 2.103316307067871, 3.1822566986083984, 4.261197090148926, 5.340137004852295, 6.419077396392822, 7.49801778793335, 8.576957702636719, 9.655898094177246, 10.73483657836914, 11.813776969909668, 12.892717361450195, 13.971656799316406, 15.05059814453125, 16.12953758239746, 17.208477020263672, 18.287418365478516, 19.36635971069336, 20.44529914855957, 21.524240493774414, 22.603179931640625, 23.68212127685547, 24.76106071472168, 25.84000015258789, 26.918941497802734, 27.997880935668945, 29.076820373535156, 30.15576171875, 31.23470115661621, 32.31364059448242, 33.392581939697266, 34.47152328491211, 35.55046081542969, 36.62940216064453, 37.708343505859375, 38.78728103637695, 39.8662223815918, 40.94516372680664, 42.024105072021484, 43.10304260253906, 44.181983947753906, 45.26092529296875]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 3.0, 7.0, 11.0, 14.0, 12.0, 16.0, 11.0, 22.0, 24.0, 24.0, 25.0, 31.0, 34.0, 29.0, 32.0, 42.0, 40.0, 36.0, 33.0, 31.0, 51.0, 31.0, 45.0, 43.0, 29.0, 32.0, 36.0, 32.0, 27.0, 28.0, 19.0, 21.0, 23.0, 14.0, 9.0, 13.0, 12.0, 14.0, 5.0, 4.0, 6.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.31160545349121, -16.7670841217041, -16.222562789916992, -15.678041458129883, -15.133520126342773, -14.588998794555664, -14.044477462768555, -13.499956130981445, -12.955434799194336, -12.410913467407227, -11.866392135620117, -11.321870803833008, -10.777349472045898, -10.232828140258789, -9.68830680847168, -9.14378547668457, -8.599264144897461, -8.054742813110352, -7.510221481323242, -6.965700149536133, -6.421178817749023, -5.876657485961914, -5.332136154174805, -4.787614822387695, -4.243093490600586, -3.6985721588134766, -3.154050827026367, -2.609529495239258, -2.0650081634521484, -1.520486831665039, -0.9759654998779297, -0.4314441680908203, 0.11307525634765625, 0.6575965881347656, 1.202117919921875, 1.7466392517089844, 2.2911605834960938, 2.835681915283203, 3.3802032470703125, 3.924724578857422, 4.469245910644531, 5.013767242431641, 5.55828857421875, 6.102809906005859, 6.647331237792969, 7.191852569580078, 7.7363739013671875, 8.280895233154297, 8.825416564941406, 9.369937896728516, 9.914459228515625, 10.458980560302734, 11.003501892089844, 11.548023223876953, 12.092544555664062, 12.637065887451172, 13.181587219238281, 13.72610855102539, 14.2706298828125, 14.81515121459961, 15.359672546386719, 15.904193878173828, 16.448715209960938, 16.993236541748047, 17.537757873535156]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 14.0, 11.0, 15.0, 18.0, 17.0, 15.0, 14.0, 29.0, 23.0, 33.0, 22.0, 45.0, 36.0, 29.0, 37.0, 45.0, 40.0, 57.0, 40.0, 31.0, 51.0, 58.0, 23.0, 32.0, 34.0, 30.0, 28.0, 19.0, 21.0, 28.0, 11.0, 13.0, 9.0, 7.0, 16.0, 4.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.943603515625, -25.96533203125, -24.987060546875, -24.0087890625, -23.030517578125, -22.05224609375, -21.073974609375, -20.095703125, -19.117431640625, -18.13916015625, -17.160888671875, -16.1826171875, -15.204345703125, -14.22607421875, -13.247802734375, -12.26953125, -11.291259765625, -10.31298828125, -9.334716796875, -8.3564453125, -7.378173828125, -6.39990234375, -5.421630859375, -4.443359375, -3.465087890625, -2.48681640625, -1.508544921875, -0.5302734375, 0.447998046875, 1.42626953125, 2.404541015625, 3.3828125, 4.361083984375, 5.33935546875, 6.317626953125, 7.2958984375, 8.274169921875, 9.25244140625, 10.230712890625, 11.208984375, 12.187255859375, 13.16552734375, 14.143798828125, 15.1220703125, 16.100341796875, 17.07861328125, 18.056884765625, 19.03515625, 20.013427734375, 20.99169921875, 21.969970703125, 22.9482421875, 23.926513671875, 24.90478515625, 25.883056640625, 26.861328125, 27.839599609375, 28.81787109375, 29.796142578125, 30.7744140625, 31.752685546875, 32.73095703125, 33.709228515625, 34.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 8.0, 14.0, 17.0, 28.0, 48.0, 66.0, 110.0, 165.0, 249.0, 463.0, 669.0, 922.0, 1391.0, 2345.0, 3662.0, 5468.0, 8726.0, 14063.0, 23602.0, 40258.0, 73807.0, 147554.0, 302451.0, 200865.0, 96261.0, 50466.0, 28794.0, 17190.0, 10479.0, 6676.0, 4060.0, 2702.0, 1822.0, 1092.0, 715.0, 499.0, 302.0, 179.0, 118.0, 87.0, 63.0, 28.0, 30.0, 23.0, 10.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.6990966796875, -5.519287109375, -5.3394775390625, -5.15966796875, -4.9798583984375, -4.800048828125, -4.6202392578125, -4.4404296875, -4.2606201171875, -4.080810546875, -3.9010009765625, -3.72119140625, -3.5413818359375, -3.361572265625, -3.1817626953125, -3.001953125, -2.8221435546875, -2.642333984375, -2.4625244140625, -2.28271484375, -2.1029052734375, -1.923095703125, -1.7432861328125, -1.5634765625, -1.3836669921875, -1.203857421875, -1.0240478515625, -0.84423828125, -0.6644287109375, -0.484619140625, -0.3048095703125, -0.125, 0.0548095703125, 0.234619140625, 0.4144287109375, 0.59423828125, 0.7740478515625, 0.953857421875, 1.1336669921875, 1.3134765625, 1.4932861328125, 1.673095703125, 1.8529052734375, 2.03271484375, 2.2125244140625, 2.392333984375, 2.5721435546875, 2.751953125, 2.9317626953125, 3.111572265625, 3.2913818359375, 3.47119140625, 3.6510009765625, 3.830810546875, 4.0106201171875, 4.1904296875, 4.3702392578125, 4.550048828125, 4.7298583984375, 4.90966796875, 5.0894775390625, 5.269287109375, 5.4490966796875, 5.62890625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 6.0, 4.0, 12.0, 17.0, 18.0, 21.0, 16.0, 22.0, 29.0, 29.0, 29.0, 34.0, 39.0, 34.0, 46.0, 33.0, 48.0, 1068.0, 49.0, 40.0, 43.0, 36.0, 43.0, 28.0, 34.0, 36.0, 29.0, 19.0, 25.0, 22.0, 17.0, 17.0, 13.0, 9.0, 6.0, 5.0, 7.0, 6.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.34375, -20.691650390625, -20.03955078125, -19.387451171875, -18.7353515625, -18.083251953125, -17.43115234375, -16.779052734375, -16.126953125, -15.474853515625, -14.82275390625, -14.170654296875, -13.5185546875, -12.866455078125, -12.21435546875, -11.562255859375, -10.91015625, -10.258056640625, -9.60595703125, -8.953857421875, -8.3017578125, -7.649658203125, -6.99755859375, -6.345458984375, -5.693359375, -5.041259765625, -4.38916015625, -3.737060546875, -3.0849609375, -2.432861328125, -1.78076171875, -1.128662109375, -0.4765625, 0.175537109375, 0.82763671875, 1.479736328125, 2.1318359375, 2.783935546875, 3.43603515625, 4.088134765625, 4.740234375, 5.392333984375, 6.04443359375, 6.696533203125, 7.3486328125, 8.000732421875, 8.65283203125, 9.304931640625, 9.95703125, 10.609130859375, 11.26123046875, 11.913330078125, 12.5654296875, 13.217529296875, 13.86962890625, 14.521728515625, 15.173828125, 15.825927734375, 16.47802734375, 17.130126953125, 17.7822265625, 18.434326171875, 19.08642578125, 19.738525390625, 20.390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 16.0, 23.0, 35.0, 49.0, 55.0, 99.0, 162.0, 217.0, 321.0, 508.0, 687.0, 1065.0, 1579.0, 2322.0, 3660.0, 5395.0, 8166.0, 12834.0, 20597.0, 33534.0, 56769.0, 105535.0, 227770.0, 1324464.0, 123657.0, 66084.0, 37531.0, 22742.0, 14414.0, 9000.0, 5921.0, 3851.0, 2562.0, 1796.0, 1213.0, 833.0, 537.0, 368.0, 249.0, 176.0, 112.0, 69.0, 49.0, 29.0, 25.0, 18.0, 5.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.78094482421875, -5.6009521484375, -5.42095947265625, -5.240966796875, -5.06097412109375, -4.8809814453125, -4.70098876953125, -4.52099609375, -4.34100341796875, -4.1610107421875, -3.98101806640625, -3.801025390625, -3.62103271484375, -3.4410400390625, -3.26104736328125, -3.0810546875, -2.90106201171875, -2.7210693359375, -2.54107666015625, -2.361083984375, -2.18109130859375, -2.0010986328125, -1.82110595703125, -1.64111328125, -1.46112060546875, -1.2811279296875, -1.10113525390625, -0.921142578125, -0.74114990234375, -0.5611572265625, -0.38116455078125, -0.201171875, -0.02117919921875, 0.1588134765625, 0.33880615234375, 0.518798828125, 0.69879150390625, 0.8787841796875, 1.05877685546875, 1.23876953125, 1.41876220703125, 1.5987548828125, 1.77874755859375, 1.958740234375, 2.13873291015625, 2.3187255859375, 2.49871826171875, 2.6787109375, 2.85870361328125, 3.0386962890625, 3.21868896484375, 3.398681640625, 3.57867431640625, 3.7586669921875, 3.93865966796875, 4.11865234375, 4.29864501953125, 4.4786376953125, 4.65863037109375, 4.838623046875, 5.01861572265625, 5.1986083984375, 5.37860107421875, 5.55859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 17.0, 16.0, 26.0, 19.0, 35.0, 36.0, 45.0, 53.0, 52.0, 55.0, 64.0, 79.0, 77.0, 71.0, 51.0, 49.0, 42.0, 42.0, 27.0, 23.0, 21.0, 9.0, 12.0, 16.0, 10.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00528717041015625, -0.005140960216522217, -0.004994750022888184, -0.00484853982925415, -0.004702329635620117, -0.004556119441986084, -0.004409909248352051, -0.004263699054718018, -0.004117488861083984, -0.003971278667449951, -0.003825068473815918, -0.0036788582801818848, -0.0035326480865478516, -0.0033864378929138184, -0.003240227699279785, -0.003094017505645752, -0.0029478073120117188, -0.0028015971183776855, -0.0026553869247436523, -0.002509176731109619, -0.002362966537475586, -0.0022167563438415527, -0.0020705461502075195, -0.0019243359565734863, -0.0017781257629394531, -0.00163191556930542, -0.0014857053756713867, -0.0013394951820373535, -0.0011932849884033203, -0.0010470747947692871, -0.0009008646011352539, -0.0007546544075012207, -0.0006084442138671875, -0.0004622340202331543, -0.0003160238265991211, -0.0001698136329650879, -2.3603439331054688e-05, 0.00012260675430297852, 0.0002688169479370117, 0.0004150271415710449, 0.0005612373352050781, 0.0007074475288391113, 0.0008536577224731445, 0.0009998679161071777, 0.001146078109741211, 0.0012922883033752441, 0.0014384984970092773, 0.0015847086906433105, 0.0017309188842773438, 0.001877129077911377, 0.00202333927154541, 0.0021695494651794434, 0.0023157596588134766, 0.0024619698524475098, 0.002608180046081543, 0.002754390239715576, 0.0029006004333496094, 0.0030468106269836426, 0.0031930208206176758, 0.003339231014251709, 0.003485441207885742, 0.0036316514015197754, 0.0037778615951538086, 0.003924071788787842, 0.004070281982421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 15.0, 14.0, 16.0, 22.0, 23.0, 31.0, 54.0, 72.0, 91.0, 126.0, 171.0, 321.0, 482.0, 872.0, 1811.0, 4464.0, 14140.0, 55196.0, 235312.0, 466138.0, 201889.0, 47090.0, 12188.0, 4105.0, 1719.0, 794.0, 490.0, 279.0, 197.0, 116.0, 91.0, 60.0, 41.0, 34.0, 18.0, 16.0, 16.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0227508544921875, -0.021978139877319336, -0.021205425262451172, -0.020432710647583008, -0.019659996032714844, -0.01888728141784668, -0.018114566802978516, -0.01734185218811035, -0.016569137573242188, -0.015796422958374023, -0.01502370834350586, -0.014250993728637695, -0.013478279113769531, -0.012705564498901367, -0.011932849884033203, -0.011160135269165039, -0.010387420654296875, -0.009614706039428711, -0.008841991424560547, -0.008069276809692383, -0.007296562194824219, -0.006523847579956055, -0.005751132965087891, -0.0049784183502197266, -0.0042057037353515625, -0.0034329891204833984, -0.0026602745056152344, -0.0018875598907470703, -0.0011148452758789062, -0.0003421306610107422, 0.0004305839538574219, 0.001203298568725586, 0.00197601318359375, 0.002748727798461914, 0.003521442413330078, 0.004294157028198242, 0.005066871643066406, 0.00583958625793457, 0.006612300872802734, 0.0073850154876708984, 0.008157730102539062, 0.008930444717407227, 0.00970315933227539, 0.010475873947143555, 0.011248588562011719, 0.012021303176879883, 0.012794017791748047, 0.013566732406616211, 0.014339447021484375, 0.015112161636352539, 0.015884876251220703, 0.016657590866088867, 0.01743030548095703, 0.018203020095825195, 0.01897573471069336, 0.019748449325561523, 0.020521163940429688, 0.02129387855529785, 0.022066593170166016, 0.02283930778503418, 0.023612022399902344, 0.024384737014770508, 0.025157451629638672, 0.025930166244506836, 0.026702880859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 11.0, 11.0, 19.0, 32.0, 48.0, 68.0, 94.0, 100.0, 120.0, 101.0, 109.0, 78.0, 64.0, 34.0, 40.0, 29.0, 21.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.005841652862727642, -0.00570902181789279, -0.005576390773057938, -0.005443759728223085, -0.005311128683388233, -0.005178498104214668, -0.005045866593718529, -0.004913236014544964, -0.004780604969710112, -0.004647973924875259, -0.004515342880040407, -0.004382711835205555, -0.004250080790370703, -0.0041174497455358505, -0.003984819166362286, -0.0038521878886967897, -0.0037195568438619375, -0.0035869257990270853, -0.003454294754192233, -0.0033216639421880245, -0.0031890328973531723, -0.00305640185251832, -0.002923770807683468, -0.0027911397628486156, -0.0026585087180137634, -0.002525877673178911, -0.002393246628344059, -0.0022606155835092068, -0.002127984771504998, -0.001995353726670146, -0.0018627226818352938, -0.0017300916370004416, -0.0015974610578268766, -0.0014648300129920244, -0.001332199084572494, -0.0011995680397376418, -0.0010669371113181114, -0.0009343060664832592, -0.000801675021648407, -0.0006690440350212157, -0.0005364130483940244, -0.00040378206176683307, -0.0002711510460358113, -0.00013852003030478954, -5.889043677598238e-06, 0.00012674194294959307, 0.0002593729877844453, 0.0003920039744116366, 0.0005246349610388279, 0.0006572659476660192, 0.0007898969342932105, 0.0009225279791280627, 0.0010551589075475931, 0.0011877899523824453, 0.0013204209972172976, 0.0014530520420521498, 0.0015856829704716802, 0.0017183140153065324, 0.0018509449437260628, 0.001983575988560915, 0.002116207033395767, 0.0022488380782306194, 0.0023814691230654716, 0.00251409993506968, 0.0026467309799045324]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 2.0, 9.0, 6.0, 9.0, 13.0, 16.0, 13.0, 24.0, 21.0, 23.0, 29.0, 29.0, 36.0, 23.0, 42.0, 51.0, 36.0, 40.0, 34.0, 28.0, 28.0, 42.0, 38.0, 40.0, 39.0, 31.0, 31.0, 29.0, 22.0, 36.0, 32.0, 19.0, 23.0, 14.0, 15.0, 14.0, 11.0, 13.0, 9.0, 8.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.002259373664855957, -0.002196243032813072, -0.0021331124007701874, -0.0020699817687273026, -0.0020068511366844177, -0.001943720504641533, -0.001880589872598648, -0.0018174592405557632, -0.0017543286085128784, -0.0016911979764699936, -0.0016280673444271088, -0.001564936712384224, -0.0015018060803413391, -0.0014386754482984543, -0.0013755448162555695, -0.0013124141842126846, -0.0012492835521697998, -0.001186152920126915, -0.0011230222880840302, -0.0010598916560411453, -0.0009967610239982605, -0.0009336303919553757, -0.0008704997599124908, -0.000807369127869606, -0.0007442384958267212, -0.0006811078637838364, -0.0006179772317409515, -0.0005548465996980667, -0.0004917159676551819, -0.00042858533561229706, -0.00036545470356941223, -0.0003023240715265274, -0.00023919343948364258, -0.00017606280744075775, -0.00011293217539787292, -4.98015433549881e-05, 1.3329088687896729e-05, 7.645972073078156e-05, 0.00013959035277366638, 0.0002027209848165512, 0.00026585161685943604, 0.00032898224890232086, 0.0003921128809452057, 0.0004552435129880905, 0.0005183741450309753, 0.0005815047770738602, 0.000644635409116745, 0.0007077660411596298, 0.0007708966732025146, 0.0008340273052453995, 0.0008971579372882843, 0.0009602885693311691, 0.001023419201374054, 0.0010865498334169388, 0.0011496804654598236, 0.0012128110975027084, 0.0012759417295455933, 0.001339072361588478, 0.001402202993631363, 0.0014653336256742477, 0.0015284642577171326, 0.0015915948897600174, 0.0016547255218029022, 0.001717856153845787, 0.0017809867858886719]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 14.0, 11.0, 15.0, 18.0, 17.0, 15.0, 14.0, 29.0, 23.0, 33.0, 22.0, 45.0, 36.0, 29.0, 36.0, 47.0, 39.0, 56.0, 41.0, 31.0, 52.0, 57.0, 23.0, 32.0, 34.0, 30.0, 28.0, 19.0, 21.0, 28.0, 11.0, 13.0, 9.0, 7.0, 16.0, 4.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.943603515625, -25.96533203125, -24.987060546875, -24.0087890625, -23.030517578125, -22.05224609375, -21.073974609375, -20.095703125, -19.117431640625, -18.13916015625, -17.160888671875, -16.1826171875, -15.204345703125, -14.22607421875, -13.247802734375, -12.26953125, -11.291259765625, -10.31298828125, -9.334716796875, -8.3564453125, -7.378173828125, -6.39990234375, -5.421630859375, -4.443359375, -3.465087890625, -2.48681640625, -1.508544921875, -0.5302734375, 0.447998046875, 1.42626953125, 2.404541015625, 3.3828125, 4.361083984375, 5.33935546875, 6.317626953125, 7.2958984375, 8.274169921875, 9.25244140625, 10.230712890625, 11.208984375, 12.187255859375, 13.16552734375, 14.143798828125, 15.1220703125, 16.100341796875, 17.07861328125, 18.056884765625, 19.03515625, 20.013427734375, 20.99169921875, 21.969970703125, 22.9482421875, 23.926513671875, 24.90478515625, 25.883056640625, 26.861328125, 27.839599609375, 28.81787109375, 29.796142578125, 30.7744140625, 31.752685546875, 32.73095703125, 33.709228515625, 34.6875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 5.0, 12.0, 14.0, 17.0, 22.0, 24.0, 34.0, 46.0, 76.0, 91.0, 145.0, 192.0, 310.0, 489.0, 731.0, 1219.0, 2363.0, 4613.0, 11635.0, 36784.0, 143490.0, 445502.0, 290560.0, 74457.0, 20669.0, 7377.0, 3242.0, 1744.0, 948.0, 546.0, 352.0, 269.0, 149.0, 113.0, 84.0, 48.0, 35.0, 38.0, 24.0, 12.0, 13.0, 17.0, 14.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-5.7578125, -5.5872802734375, -5.416748046875, -5.2462158203125, -5.07568359375, -4.9051513671875, -4.734619140625, -4.5640869140625, -4.3935546875, -4.2230224609375, -4.052490234375, -3.8819580078125, -3.71142578125, -3.5408935546875, -3.370361328125, -3.1998291015625, -3.029296875, -2.8587646484375, -2.688232421875, -2.5177001953125, -2.34716796875, -2.1766357421875, -2.006103515625, -1.8355712890625, -1.6650390625, -1.4945068359375, -1.323974609375, -1.1534423828125, -0.98291015625, -0.8123779296875, -0.641845703125, -0.4713134765625, -0.30078125, -0.1302490234375, 0.040283203125, 0.2108154296875, 0.38134765625, 0.5518798828125, 0.722412109375, 0.8929443359375, 1.0634765625, 1.2340087890625, 1.404541015625, 1.5750732421875, 1.74560546875, 1.9161376953125, 2.086669921875, 2.2572021484375, 2.427734375, 2.5982666015625, 2.768798828125, 2.9393310546875, 3.10986328125, 3.2803955078125, 3.450927734375, 3.6214599609375, 3.7919921875, 3.9625244140625, 4.133056640625, 4.3035888671875, 4.47412109375, 4.6446533203125, 4.815185546875, 4.9857177734375, 5.15625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 6.0, 11.0, 14.0, 8.0, 14.0, 23.0, 29.0, 33.0, 52.0, 59.0, 58.0, 79.0, 83.0, 2109.0, 86.0, 59.0, 57.0, 57.0, 44.0, 35.0, 26.0, 25.0, 25.0, 15.0, 10.0, 9.0, 6.0, 13.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.3125, -75.005859375, -72.69921875, -70.392578125, -68.0859375, -65.779296875, -63.47265625, -61.166015625, -58.859375, -56.552734375, -54.24609375, -51.939453125, -49.6328125, -47.326171875, -45.01953125, -42.712890625, -40.40625, -38.099609375, -35.79296875, -33.486328125, -31.1796875, -28.873046875, -26.56640625, -24.259765625, -21.953125, -19.646484375, -17.33984375, -15.033203125, -12.7265625, -10.419921875, -8.11328125, -5.806640625, -3.5, -1.193359375, 1.11328125, 3.419921875, 5.7265625, 8.033203125, 10.33984375, 12.646484375, 14.953125, 17.259765625, 19.56640625, 21.873046875, 24.1796875, 26.486328125, 28.79296875, 31.099609375, 33.40625, 35.712890625, 38.01953125, 40.326171875, 42.6328125, 44.939453125, 47.24609375, 49.552734375, 51.859375, 54.166015625, 56.47265625, 58.779296875, 61.0859375, 63.392578125, 65.69921875, 68.005859375, 70.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 4.0, 8.0, 10.0, 15.0, 24.0, 28.0, 37.0, 42.0, 70.0, 100.0, 112.0, 213.0, 276.0, 383.0, 690.0, 1203.0, 2927.0, 13283.0, 159533.0, 2840473.0, 110032.0, 10586.0, 2629.0, 1151.0, 610.0, 364.0, 275.0, 155.0, 129.0, 95.0, 66.0, 41.0, 35.0, 25.0, 16.0, 20.0, 7.0, 7.0, 6.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.015625, -9.6865234375, -9.357421875, -9.0283203125, -8.69921875, -8.3701171875, -8.041015625, -7.7119140625, -7.3828125, -7.0537109375, -6.724609375, -6.3955078125, -6.06640625, -5.7373046875, -5.408203125, -5.0791015625, -4.75, -4.4208984375, -4.091796875, -3.7626953125, -3.43359375, -3.1044921875, -2.775390625, -2.4462890625, -2.1171875, -1.7880859375, -1.458984375, -1.1298828125, -0.80078125, -0.4716796875, -0.142578125, 0.1865234375, 0.515625, 0.8447265625, 1.173828125, 1.5029296875, 1.83203125, 2.1611328125, 2.490234375, 2.8193359375, 3.1484375, 3.4775390625, 3.806640625, 4.1357421875, 4.46484375, 4.7939453125, 5.123046875, 5.4521484375, 5.78125, 6.1103515625, 6.439453125, 6.7685546875, 7.09765625, 7.4267578125, 7.755859375, 8.0849609375, 8.4140625, 8.7431640625, 9.072265625, 9.4013671875, 9.73046875, 10.0595703125, 10.388671875, 10.7177734375, 11.046875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 14.0, 39.0, 76.0, 174.0, 246.0, 193.0, 118.0, 53.0, 28.0, 10.0, 9.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.93960571289062, -114.4190902709961, -110.89857482910156, -107.37805938720703, -103.8575439453125, -100.33702850341797, -96.81651306152344, -93.2959976196289, -89.77548217773438, -86.25496673583984, -82.73445129394531, -79.21393585205078, -75.69342041015625, -72.17290496826172, -68.65238952636719, -65.13187408447266, -61.611358642578125, -58.090843200683594, -54.57032775878906, -51.04981231689453, -47.529296875, -44.00878143310547, -40.48826599121094, -36.967750549316406, -33.447235107421875, -29.926719665527344, -26.406204223632812, -22.88568878173828, -19.36517333984375, -15.844657897949219, -12.324142456054688, -8.803627014160156, -5.283103942871094, -1.7625885009765625, 1.7579269409179688, 5.2784423828125, 8.798957824707031, 12.319473266601562, 15.839988708496094, 19.360504150390625, 22.881019592285156, 26.401535034179688, 29.92205047607422, 33.44256591796875, 36.96308135986328, 40.48359680175781, 44.004112243652344, 47.524627685546875, 51.045143127441406, 54.56565856933594, 58.08617401123047, 61.606689453125, 65.12720489501953, 68.64772033691406, 72.1682357788086, 75.68875122070312, 79.20926666259766, 82.72978210449219, 86.25029754638672, 89.77081298828125, 93.29132843017578, 96.81184387207031, 100.33235931396484, 103.85287475585938, 107.3733901977539]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 4.0, 12.0, 7.0, 12.0, 21.0, 14.0, 18.0, 30.0, 34.0, 32.0, 23.0, 50.0, 39.0, 38.0, 48.0, 49.0, 59.0, 40.0, 48.0, 55.0, 44.0, 45.0, 41.0, 33.0, 37.0, 36.0, 22.0, 25.0, 21.0, 10.0, 12.0, 6.0, 6.0, 9.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.462646484375, -57.190391540527344, -54.91813659667969, -52.6458854675293, -50.37363052368164, -48.101375579833984, -45.829124450683594, -43.55686950683594, -41.28461456298828, -39.012359619140625, -36.74010467529297, -34.46785354614258, -32.19559860229492, -29.923343658447266, -27.651090621948242, -25.37883758544922, -23.106582641601562, -20.834327697753906, -18.562074661254883, -16.28982162475586, -14.017566680908203, -11.745312690734863, -9.473058700561523, -7.200804710388184, -4.928550720214844, -2.656296730041504, -0.38404273986816406, 1.8882112503051758, 4.160465240478516, 6.4327192306518555, 8.704973220825195, 10.977227210998535, 13.249481201171875, 15.521735191345215, 17.793989181518555, 20.066242218017578, 22.338497161865234, 24.61075210571289, 26.883005142211914, 29.155258178710938, 31.427513122558594, 33.69976806640625, 35.972023010253906, 38.2442741394043, 40.51652908325195, 42.78878402709961, 45.06103515625, 47.333290100097656, 49.60554504394531, 51.87779998779297, 54.150054931640625, 56.422306060791016, 58.69456100463867, 60.96681594848633, 63.23906707763672, 65.51132202148438, 67.78357696533203, 70.05583190917969, 72.32808685302734, 74.600341796875, 76.87258911132812, 79.14484405517578, 81.41709899902344, 83.6893539428711, 85.96160888671875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 11.0, 9.0, 16.0, 17.0, 18.0, 22.0, 40.0, 60.0, 81.0, 132.0, 166.0, 237.0, 369.0, 577.0, 812.0, 1174.0, 1797.0, 2694.0, 3717.0, 5189.0, 1006721.0, 7955.0, 5121.0, 3672.0, 2548.0, 1716.0, 1237.0, 764.0, 517.0, 348.0, 219.0, 173.0, 105.0, 90.0, 51.0, 48.0, 39.0, 21.0, 24.0, 11.0, 4.0, 7.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.675667762756348, -11.31039047241211, -10.945112228393555, -10.579834938049316, -10.214557647705078, -9.849279403686523, -9.484002113342285, -9.118724822998047, -8.753446578979492, -8.388169288635254, -8.0228910446167, -7.657613754272461, -7.2923359870910645, -6.927058219909668, -6.56178092956543, -6.196503162384033, -5.831225395202637, -5.46594762802124, -5.100669860839844, -4.7353925704956055, -4.370114803314209, -4.0048370361328125, -3.639559507369995, -3.2742819786071777, -2.9090042114257812, -2.5437264442443848, -2.1784489154815674, -1.8131712675094604, -1.4478936195373535, -1.0826159715652466, -0.7173383235931396, -0.35206079483032227, 0.013217926025390625, 0.37849557399749756, 0.7437732219696045, 1.1090508699417114, 1.4743285179138184, 1.8396061658859253, 2.2048838138580322, 2.5701613426208496, 2.935439109802246, 3.3007168769836426, 3.66599440574646, 4.031271934509277, 4.396549701690674, 4.76182746887207, 5.127104759216309, 5.492382526397705, 5.857660293579102, 6.222938060760498, 6.5882158279418945, 6.953493118286133, 7.318770885467529, 7.684048652648926, 8.049325942993164, 8.414604187011719, 8.779881477355957, 9.145158767700195, 9.51043701171875, 9.875714302062988, 10.240991592407227, 10.606269836425781, 10.97154712677002, 11.336824417114258, 11.702102661132812]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 10.0, 12.0, 27.0, 52.0, 124.0, 158.0, 10998.0, 51452148.0, 182.0, 66.0, 58.0, 57.0, 31.0, 26.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5163.12060546875, -5030.8798828125, -4898.63916015625, -4766.39794921875, -4634.1572265625, -4501.91650390625, -4369.67578125, -4237.4345703125, -4105.19384765625, -3972.953125, -3840.712158203125, -3708.471435546875, -3576.23046875, -3443.98974609375, -3311.7490234375, -3179.508056640625, -3047.267333984375, -2915.026611328125, -2782.78564453125, -2650.544921875, -2518.303955078125, -2386.063232421875, -2253.822265625, -2121.58154296875, -1989.3406982421875, -1857.099853515625, -1724.8590087890625, -1592.6181640625, -1460.37744140625, -1328.136474609375, -1195.895751953125, -1063.6549072265625, -931.414306640625, -799.1734619140625, -666.9326171875, -534.6918334960938, -402.45098876953125, -270.21014404296875, -137.9693603515625, -5.728515625, 126.5123291015625, 258.753173828125, 390.9939880371094, 523.2348022460938, 655.4756469726562, 787.7164916992188, 919.957275390625, 1052.1981201171875, 1184.43896484375, 1316.6798095703125, 1448.920654296875, 1581.161376953125, 1713.40234375, 1845.64306640625, 1977.8839111328125, 2110.124755859375, 2242.36572265625, 2374.6064453125, 2506.847412109375, 2639.088134765625, 2771.3291015625, 2903.56982421875, 3035.810546875, 3168.051513671875, 3300.292236328125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [8.0, 4.0, 10.0, 15.0, 5.0, 21.0, 39.0, 59.0, 57.0, 110.0, 148.0, 231.0, 354.0, 476.0, 572.0, 768.0, 1119.0, 1700.0, 2510.0, 3661.0, 5277.0, 7544.0, 11175.0, 16182.0, 24880.0, 37421.0, 58824.0, 92086.0, 151729.0, 264004.0, 613418.0, 3900479.0, 481774.0, 233173.0, 137599.0, 84448.0, 54087.0, 34462.0, 22789.0, 14861.0, 10542.0, 6893.0, 4675.0, 3500.0, 2409.0, 1515.0, 1135.0, 811.0, 574.0, 405.0, 303.0, 198.0, 134.0, 80.0, 61.0, 33.0, 29.0, 28.0, 20.0, 11.0, 12.0, 3.0, 1.0, 5.0], "bins": [-2.548828125, -2.4676513671875, -2.386474609375, -2.3052978515625, -2.22412109375, -2.1429443359375, -2.061767578125, -1.9805908203125, -1.8994140625, -1.8182373046875, -1.737060546875, -1.6558837890625, -1.57470703125, -1.4935302734375, -1.412353515625, -1.3311767578125, -1.25, -1.1688232421875, -1.087646484375, -1.0064697265625, -0.92529296875, -0.8441162109375, -0.762939453125, -0.6817626953125, -0.6005859375, -0.5194091796875, -0.438232421875, -0.3570556640625, -0.27587890625, -0.1947021484375, -0.113525390625, -0.0323486328125, 0.048828125, 0.1300048828125, 0.211181640625, 0.2923583984375, 0.37353515625, 0.4547119140625, 0.535888671875, 0.6170654296875, 0.6982421875, 0.7794189453125, 0.860595703125, 0.9417724609375, 1.02294921875, 1.1041259765625, 1.185302734375, 1.2664794921875, 1.34765625, 1.4288330078125, 1.510009765625, 1.5911865234375, 1.67236328125, 1.7535400390625, 1.834716796875, 1.9158935546875, 1.9970703125, 2.0782470703125, 2.159423828125, 2.2406005859375, 2.32177734375, 2.4029541015625, 2.484130859375, 2.5653076171875, 2.646484375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 3.0, 9.0, 9.0, 7.0, 14.0, 14.0, 20.0, 26.0, 29.0, 34.0, 37.0, 34.0, 35.0, 43.0, 40.0, 42.0, 81.0, 366.0, 580.0, 124.0, 53.0, 54.0, 43.0, 38.0, 26.0, 32.0, 34.0, 21.0, 27.0, 29.0, 13.0, 15.0, 18.0, 12.0, 5.0, 7.0, 8.0, 7.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.66534423828125, -6.4439697265625, -6.22259521484375, -6.001220703125, -5.77984619140625, -5.5584716796875, -5.33709716796875, -5.11572265625, -4.89434814453125, -4.6729736328125, -4.45159912109375, -4.230224609375, -4.00885009765625, -3.7874755859375, -3.56610107421875, -3.3447265625, -3.12335205078125, -2.9019775390625, -2.68060302734375, -2.459228515625, -2.23785400390625, -2.0164794921875, -1.79510498046875, -1.57373046875, -1.35235595703125, -1.1309814453125, -0.90960693359375, -0.688232421875, -0.46685791015625, -0.2454833984375, -0.02410888671875, 0.197265625, 0.41864013671875, 0.6400146484375, 0.86138916015625, 1.082763671875, 1.30413818359375, 1.5255126953125, 1.74688720703125, 1.96826171875, 2.18963623046875, 2.4110107421875, 2.63238525390625, 2.853759765625, 3.07513427734375, 3.2965087890625, 3.51788330078125, 3.7392578125, 3.96063232421875, 4.1820068359375, 4.40338134765625, 4.624755859375, 4.84613037109375, 5.0675048828125, 5.28887939453125, 5.51025390625, 5.73162841796875, 5.9530029296875, 6.17437744140625, 6.395751953125, 6.61712646484375, 6.8385009765625, 7.05987548828125, 7.28125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 12.0, 19.0, 14.0, 27.0, 19.0, 33.0, 62.0, 32.0, 71.0, 159.0, 175.0, 219.0, 311.0, 532.0, 678.0, 1058.0, 1566.0, 2353.0, 3170.0, 4743.0, 7200.0, 11652.0, 18402.0, 29579.0, 47705.0, 78133.0, 135718.0, 252716.0, 667276.0, 3942583.0, 540929.0, 228047.0, 123315.0, 72449.0, 44030.0, 27363.0, 16878.0, 10908.0, 6918.0, 4638.0, 3016.0, 2103.0, 1391.0, 976.0, 658.0, 474.0, 339.0, 214.0, 152.0, 103.0, 90.0, 67.0, 49.0, 51.0, 24.0, 0.0, 22.0, 4.0, 4.0, 5.0, 13.0], "bins": [-3.228515625, -3.128936767578125, -3.02935791015625, -2.929779052734375, -2.8302001953125, -2.730621337890625, -2.63104248046875, -2.531463623046875, -2.431884765625, -2.332305908203125, -2.23272705078125, -2.133148193359375, -2.0335693359375, -1.933990478515625, -1.83441162109375, -1.734832763671875, -1.63525390625, -1.535675048828125, -1.43609619140625, -1.336517333984375, -1.2369384765625, -1.137359619140625, -1.03778076171875, -0.938201904296875, -0.838623046875, -0.739044189453125, -0.63946533203125, -0.539886474609375, -0.4403076171875, -0.340728759765625, -0.24114990234375, -0.141571044921875, -0.0419921875, 0.057586669921875, 0.15716552734375, 0.256744384765625, 0.3563232421875, 0.455902099609375, 0.55548095703125, 0.655059814453125, 0.754638671875, 0.854217529296875, 0.95379638671875, 1.053375244140625, 1.1529541015625, 1.252532958984375, 1.35211181640625, 1.451690673828125, 1.55126953125, 1.650848388671875, 1.75042724609375, 1.850006103515625, 1.9495849609375, 2.049163818359375, 2.14874267578125, 2.248321533203125, 2.347900390625, 2.447479248046875, 2.54705810546875, 2.646636962890625, 2.7462158203125, 2.845794677734375, 2.94537353515625, 3.044952392578125, 3.14453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 4.0, 11.0, 5.0, 6.0, 22.0, 13.0, 19.0, 15.0, 27.0, 40.0, 26.0, 30.0, 37.0, 46.0, 46.0, 52.0, 104.0, 354.0, 530.0, 162.0, 70.0, 54.0, 52.0, 44.0, 39.0, 33.0, 23.0, 22.0, 20.0, 28.0, 16.0, 18.0, 12.0, 16.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.44232177734375, -5.2674560546875, -5.09259033203125, -4.917724609375, -4.74285888671875, -4.5679931640625, -4.39312744140625, -4.21826171875, -4.04339599609375, -3.8685302734375, -3.69366455078125, -3.518798828125, -3.34393310546875, -3.1690673828125, -2.99420166015625, -2.8193359375, -2.64447021484375, -2.4696044921875, -2.29473876953125, -2.119873046875, -1.94500732421875, -1.7701416015625, -1.59527587890625, -1.42041015625, -1.24554443359375, -1.0706787109375, -0.89581298828125, -0.720947265625, -0.54608154296875, -0.3712158203125, -0.19635009765625, -0.021484375, 0.15338134765625, 0.3282470703125, 0.50311279296875, 0.677978515625, 0.85284423828125, 1.0277099609375, 1.20257568359375, 1.37744140625, 1.55230712890625, 1.7271728515625, 1.90203857421875, 2.076904296875, 2.25177001953125, 2.4266357421875, 2.60150146484375, 2.7763671875, 2.95123291015625, 3.1260986328125, 3.30096435546875, 3.475830078125, 3.65069580078125, 3.8255615234375, 4.00042724609375, 4.17529296875, 4.35015869140625, 4.5250244140625, 4.69989013671875, 4.874755859375, 5.04962158203125, 5.2244873046875, 5.39935302734375, 5.57421875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 12.0, 6.0, 5.0, 14.0, 27.0, 37.0, 22.0, 33.0, 53.0, 57.0, 55.0, 97.0, 132.0, 117.0, 186.0, 255.0, 349.0, 499.0, 636.0, 806.0, 1258.0, 1856.0, 2673.0, 4456.0, 7543.0, 15317.0, 36407.0, 146945.0, 5910017.0, 99779.0, 29770.0, 12836.0, 6789.0, 3880.0, 2571.0, 1683.0, 1107.0, 821.0, 580.0, 396.0, 344.0, 252.0, 187.0, 131.0, 76.0, 77.0, 59.0, 45.0, 54.0, 46.0, 31.0, 18.0, 10.0, 9.0, 5.0, 8.0, 2.0, 9.0, 0.0, 6.0], "bins": [-9.296875, -9.0098876953125, -8.722900390625, -8.4359130859375, -8.14892578125, -7.8619384765625, -7.574951171875, -7.2879638671875, -7.0009765625, -6.7139892578125, -6.427001953125, -6.1400146484375, -5.85302734375, -5.5660400390625, -5.279052734375, -4.9920654296875, -4.705078125, -4.4180908203125, -4.131103515625, -3.8441162109375, -3.55712890625, -3.2701416015625, -2.983154296875, -2.6961669921875, -2.4091796875, -2.1221923828125, -1.835205078125, -1.5482177734375, -1.26123046875, -0.9742431640625, -0.687255859375, -0.4002685546875, -0.11328125, 0.1737060546875, 0.460693359375, 0.7476806640625, 1.03466796875, 1.3216552734375, 1.608642578125, 1.8956298828125, 2.1826171875, 2.4696044921875, 2.756591796875, 3.0435791015625, 3.33056640625, 3.6175537109375, 3.904541015625, 4.1915283203125, 4.478515625, 4.7655029296875, 5.052490234375, 5.3394775390625, 5.62646484375, 5.9134521484375, 6.200439453125, 6.4874267578125, 6.7744140625, 7.0614013671875, 7.348388671875, 7.6353759765625, 7.92236328125, 8.2093505859375, 8.496337890625, 8.7833251953125, 9.0703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 2.0, 7.0, 9.0, 7.0, 11.0, 12.0, 10.0, 16.0, 15.0, 25.0, 20.0, 28.0, 34.0, 44.0, 41.0, 35.0, 49.0, 68.0, 133.0, 340.0, 415.0, 163.0, 85.0, 69.0, 44.0, 48.0, 36.0, 32.0, 29.0, 41.0, 24.0, 25.0, 13.0, 14.0, 10.0, 11.0, 6.0, 10.0, 8.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.416015625, -3.30609130859375, -3.1961669921875, -3.08624267578125, -2.976318359375, -2.86639404296875, -2.7564697265625, -2.64654541015625, -2.53662109375, -2.42669677734375, -2.3167724609375, -2.20684814453125, -2.096923828125, -1.98699951171875, -1.8770751953125, -1.76715087890625, -1.6572265625, -1.54730224609375, -1.4373779296875, -1.32745361328125, -1.217529296875, -1.10760498046875, -0.9976806640625, -0.88775634765625, -0.77783203125, -0.66790771484375, -0.5579833984375, -0.44805908203125, -0.338134765625, -0.22821044921875, -0.1182861328125, -0.00836181640625, 0.1015625, 0.21148681640625, 0.3214111328125, 0.43133544921875, 0.541259765625, 0.65118408203125, 0.7611083984375, 0.87103271484375, 0.98095703125, 1.09088134765625, 1.2008056640625, 1.31072998046875, 1.420654296875, 1.53057861328125, 1.6405029296875, 1.75042724609375, 1.8603515625, 1.97027587890625, 2.0802001953125, 2.19012451171875, 2.300048828125, 2.40997314453125, 2.5198974609375, 2.62982177734375, 2.73974609375, 2.84967041015625, 2.9595947265625, 3.06951904296875, 3.179443359375, 3.28936767578125, 3.3992919921875, 3.50921630859375, 3.619140625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 38.0, 75.0, 362.0, 398.0, 77.0, 30.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.866183280944824, -13.000533103942871, -12.134882926940918, -11.269231796264648, -10.403581619262695, -9.537931442260742, -8.672281265258789, -7.806630611419678, -6.940980434417725, -6.0753302574157715, -5.20967960357666, -4.344029426574707, -3.478379011154175, -2.6127285957336426, -1.7470784187316895, -0.8814277648925781, -0.015777587890625, 0.8498727679252625, 1.71552312374115, 2.5811734199523926, 3.446823835372925, 4.312474250793457, 5.17812442779541, 6.0437750816345215, 6.909425258636475, 7.775075435638428, 8.640726089477539, 9.506376266479492, 10.372026443481445, 11.237676620483398, 12.103326797485352, 12.968977928161621, 13.834627151489258, 14.700277328491211, 15.565927505493164, 16.431577682495117, 17.29722785949707, 18.162879943847656, 19.02853012084961, 19.894180297851562, 20.759830474853516, 21.62548065185547, 22.491130828857422, 23.356781005859375, 24.222431182861328, 25.08808135986328, 25.953731536865234, 26.81938362121582, 27.68503189086914, 28.550682067871094, 29.416332244873047, 30.281982421875, 31.147632598876953, 32.013282775878906, 32.87893295288086, 33.74458312988281, 34.61023712158203, 35.475887298583984, 36.34153747558594, 37.20718765258789, 38.072837829589844, 38.9384880065918, 39.80413818359375, 40.6697883605957, 41.535438537597656]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 9.0, 5.0, 9.0, 17.0, 12.0, 18.0, 16.0, 25.0, 14.0, 30.0, 39.0, 24.0, 28.0, 43.0, 33.0, 45.0, 22.0, 39.0, 44.0, 47.0, 42.0, 43.0, 35.0, 36.0, 34.0, 32.0, 37.0, 27.0, 28.0, 18.0, 21.0, 24.0, 14.0, 19.0, 11.0, 17.0, 13.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.966644763946533, -4.810634613037109, -4.6546244621276855, -4.498614311218262, -4.342604637145996, -4.186594486236572, -4.030584335327148, -3.8745741844177246, -3.718564033508301, -3.562553882598877, -3.406543731689453, -3.2505338191986084, -3.0945236682891846, -2.9385135173797607, -2.782503604888916, -2.626493453979492, -2.4704833030700684, -2.3144731521606445, -2.1584630012512207, -2.002453088760376, -1.8464429378509521, -1.6904327869415283, -1.534422755241394, -1.3784127235412598, -1.222402572631836, -1.066392421722412, -0.9103823900222778, -0.7543722987174988, -0.5983622074127197, -0.4423521161079407, -0.2863420248031616, -0.13033199310302734, 0.02567768096923828, 0.18168777227401733, 0.3376978635787964, 0.49370795488357544, 0.6497180461883545, 0.8057281374931335, 0.9617382287979126, 1.1177482604980469, 1.2737584114074707, 1.4297685623168945, 1.5857785940170288, 1.741788625717163, 1.897798776626587, 2.0538089275360107, 2.2098188400268555, 2.3658289909362793, 2.521839141845703, 2.677849292755127, 2.833859443664551, 2.9898693561553955, 3.1458795070648193, 3.301889657974243, 3.457899570465088, 3.6139097213745117, 3.7699198722839355, 3.9259300231933594, 4.081940174102783, 4.237950325012207, 4.393959999084473, 4.5499701499938965, 4.70598030090332, 4.861990451812744, 5.018000602722168]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 3.0, 6.0, 9.0, 9.0, 11.0, 20.0, 32.0, 37.0, 31.0, 66.0, 76.0, 102.0, 129.0, 177.0, 288.0, 472.0, 663.0, 1149.0, 1865.0, 3293.0, 6333.0, 14010.0, 38173.0, 189674.0, 3824287.0, 73063.0, 21455.0, 8882.0, 4212.0, 2208.0, 1276.0, 795.0, 514.0, 321.0, 208.0, 119.0, 87.0, 61.0, 57.0, 45.0, 19.0, 13.0, 11.0, 4.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0255584716796875, -0.0248720645904541, -0.024185657501220703, -0.023499250411987305, -0.022812843322753906, -0.022126436233520508, -0.02144002914428711, -0.02075362205505371, -0.020067214965820312, -0.019380807876586914, -0.018694400787353516, -0.018007993698120117, -0.01732158660888672, -0.01663517951965332, -0.015948772430419922, -0.015262365341186523, -0.014575958251953125, -0.013889551162719727, -0.013203144073486328, -0.01251673698425293, -0.011830329895019531, -0.011143922805786133, -0.010457515716552734, -0.009771108627319336, -0.009084701538085938, -0.008398294448852539, -0.007711887359619141, -0.007025480270385742, -0.006339073181152344, -0.005652666091918945, -0.004966259002685547, -0.0042798519134521484, -0.00359344482421875, -0.0029070377349853516, -0.002220630645751953, -0.0015342235565185547, -0.0008478164672851562, -0.0001614093780517578, 0.0005249977111816406, 0.001211404800415039, 0.0018978118896484375, 0.002584218978881836, 0.0032706260681152344, 0.003957033157348633, 0.004643440246582031, 0.00532984733581543, 0.006016254425048828, 0.0067026615142822266, 0.007389068603515625, 0.008075475692749023, 0.008761882781982422, 0.00944828987121582, 0.010134696960449219, 0.010821104049682617, 0.011507511138916016, 0.012193918228149414, 0.012880325317382812, 0.013566732406616211, 0.01425313949584961, 0.014939546585083008, 0.015625953674316406, 0.016312360763549805, 0.016998767852783203, 0.0176851749420166, 0.01837158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 4.0, 8.0, 6.0, 5.0, 10.0, 12.0, 10.0, 11.0, 25.0, 780.0, 16.0, 14.0, 13.0, 9.0, 8.0, 6.0, 8.0, 5.0, 6.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444122314453125, -0.004296720027923584, -0.004149317741394043, -0.004001915454864502, -0.003854513168334961, -0.00370711088180542, -0.003559708595275879, -0.003412306308746338, -0.003264904022216797, -0.003117501735687256, -0.002970099449157715, -0.002822697162628174, -0.002675294876098633, -0.002527892589569092, -0.0023804903030395508, -0.0022330880165100098, -0.0020856857299804688, -0.0019382834434509277, -0.0017908811569213867, -0.0016434788703918457, -0.0014960765838623047, -0.0013486742973327637, -0.0012012720108032227, -0.0010538697242736816, -0.0009064674377441406, -0.0007590651512145996, -0.0006116628646850586, -0.0004642605781555176, -0.00031685829162597656, -0.00016945600509643555, -2.205371856689453e-05, 0.00012534856796264648, 0.0002727508544921875, 0.0004201531410217285, 0.0005675554275512695, 0.0007149577140808105, 0.0008623600006103516, 0.0010097622871398926, 0.0011571645736694336, 0.0013045668601989746, 0.0014519691467285156, 0.0015993714332580566, 0.0017467737197875977, 0.0018941760063171387, 0.0020415782928466797, 0.0021889805793762207, 0.0023363828659057617, 0.0024837851524353027, 0.0026311874389648438, 0.0027785897254943848, 0.0029259920120239258, 0.003073394298553467, 0.003220796585083008, 0.003368198871612549, 0.00351560115814209, 0.003663003444671631, 0.003810405731201172, 0.003957808017730713, 0.004105210304260254, 0.004252612590789795, 0.004400014877319336, 0.004547417163848877, 0.004694819450378418, 0.004842221736907959, 0.0049896240234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 4.0, 9.0, 7.0, 5.0, 18.0, 29.0, 49.0, 91.0, 146.0, 302.0, 786.0, 2859.0, 16661.0, 208067.0, 3694681.0, 247930.0, 18163.0, 2937.0, 807.0, 339.0, 143.0, 91.0, 49.0, 25.0, 18.0, 13.0, 14.0, 5.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.039825439453125, -0.03870439529418945, -0.037583351135253906, -0.03646230697631836, -0.03534126281738281, -0.034220218658447266, -0.03309917449951172, -0.03197813034057617, -0.030857086181640625, -0.029736042022705078, -0.02861499786376953, -0.027493953704833984, -0.026372909545898438, -0.02525186538696289, -0.024130821228027344, -0.023009777069091797, -0.02188873291015625, -0.020767688751220703, -0.019646644592285156, -0.01852560043334961, -0.017404556274414062, -0.016283512115478516, -0.015162467956542969, -0.014041423797607422, -0.012920379638671875, -0.011799335479736328, -0.010678291320800781, -0.009557247161865234, -0.008436203002929688, -0.007315158843994141, -0.006194114685058594, -0.005073070526123047, -0.0039520263671875, -0.002830982208251953, -0.0017099380493164062, -0.0005888938903808594, 0.0005321502685546875, 0.0016531944274902344, 0.0027742385864257812, 0.003895282745361328, 0.005016326904296875, 0.006137371063232422, 0.007258415222167969, 0.008379459381103516, 0.009500503540039062, 0.01062154769897461, 0.011742591857910156, 0.012863636016845703, 0.01398468017578125, 0.015105724334716797, 0.016226768493652344, 0.01734781265258789, 0.018468856811523438, 0.019589900970458984, 0.02071094512939453, 0.021831989288330078, 0.022953033447265625, 0.024074077606201172, 0.02519512176513672, 0.026316165924072266, 0.027437210083007812, 0.02855825424194336, 0.029679298400878906, 0.030800342559814453, 0.03192138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 8.0, 3.0, 12.0, 10.0, 16.0, 22.0, 23.0, 35.0, 62.0, 78.0, 117.0, 166.0, 240.0, 431.0, 820.0, 828.0, 407.0, 256.0, 139.0, 114.0, 74.0, 54.0, 43.0, 39.0, 26.0, 12.0, 17.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00598907470703125, -0.005775034427642822, -0.0055609941482543945, -0.005346953868865967, -0.005132913589477539, -0.004918873310089111, -0.004704833030700684, -0.004490792751312256, -0.004276752471923828, -0.0040627121925354, -0.0038486719131469727, -0.003634631633758545, -0.003420591354370117, -0.0032065510749816895, -0.0029925107955932617, -0.002778470516204834, -0.0025644302368164062, -0.0023503899574279785, -0.0021363496780395508, -0.001922309398651123, -0.0017082691192626953, -0.0014942288398742676, -0.0012801885604858398, -0.0010661482810974121, -0.0008521080017089844, -0.0006380677223205566, -0.0004240274429321289, -0.00020998716354370117, 4.0531158447265625e-06, 0.0002180933952331543, 0.00043213367462158203, 0.0006461739540100098, 0.0008602142333984375, 0.0010742545127868652, 0.001288294792175293, 0.0015023350715637207, 0.0017163753509521484, 0.0019304156303405762, 0.002144455909729004, 0.0023584961891174316, 0.0025725364685058594, 0.002786576747894287, 0.003000617027282715, 0.0032146573066711426, 0.0034286975860595703, 0.003642737865447998, 0.0038567781448364258, 0.0040708184242248535, 0.004284858703613281, 0.004498898983001709, 0.004712939262390137, 0.0049269795417785645, 0.005141019821166992, 0.00535506010055542, 0.005569100379943848, 0.005783140659332275, 0.005997180938720703, 0.006211221218109131, 0.006425261497497559, 0.006639301776885986, 0.006853342056274414, 0.007067382335662842, 0.0072814226150512695, 0.007495462894439697, 0.007709503173828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 15.0, 18.0, 33.0, 60.0, 90.0, 138.0, 154.0, 149.0, 111.0, 96.0, 41.0, 30.0, 22.0, 16.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032929886132478714, -0.031552888453006744, -0.030175894498825073, -0.028798898681998253, -0.027421902865171432, -0.026044907048344612, -0.024667911231517792, -0.02329091541469097, -0.02191391959786415, -0.02053692378103733, -0.01915992796421051, -0.01778293214738369, -0.01640593633055687, -0.01502894051373005, -0.013651944696903229, -0.012274948880076408, -0.010897953063249588, -0.009520957246422768, -0.008143961429595947, -0.006766965612769127, -0.0053899697959423065, -0.004012973979115486, -0.0026359781622886658, -0.0012589823454618454, 0.00011801347136497498, 0.0014950092881917953, 0.0028720051050186157, 0.004249000921845436, 0.0056259967386722565, 0.007002992555499077, 0.008379988372325897, 0.009756984189152718, 0.011133983731269836, 0.012510979548096657, 0.013887975364923477, 0.015264971181750298, 0.016641966998577118, 0.01801896281540394, 0.01939595863223076, 0.02077295444905758, 0.0221499502658844, 0.02352694608271122, 0.02490394189953804, 0.02628093771636486, 0.02765793353319168, 0.0290349293500185, 0.03041192516684532, 0.03178892284631729, 0.03316591680049896, 0.034542910754680634, 0.0359199084341526, 0.03729690611362457, 0.038673900067806244, 0.040050894021987915, 0.041427891701459885, 0.042804889380931854, 0.044181883335113525, 0.0455588772892952, 0.046935874968767166, 0.048312872648239136, 0.04968986660242081, 0.05106686055660248, 0.05244385823607445, 0.05382085591554642, 0.05519784986972809]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 12.0, 15.0, 24.0, 17.0, 29.0, 22.0, 38.0, 35.0, 43.0, 50.0, 46.0, 48.0, 45.0, 60.0, 47.0, 46.0, 57.0, 45.0, 49.0, 29.0, 43.0, 32.0, 30.0, 24.0, 21.0, 17.0, 12.0, 15.0, 11.0, 6.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02670830488204956, -0.02584611438214779, -0.024983923882246017, -0.024121733382344246, -0.023259542882442474, -0.022397352382540703, -0.02153516188263893, -0.02067297138273716, -0.019810780882835388, -0.018948590382933617, -0.018086399883031845, -0.017224209383130074, -0.016362018883228302, -0.01549982838332653, -0.014637637883424759, -0.013775447383522987, -0.012913256883621216, -0.012051066383719444, -0.011188875883817673, -0.010326685383915901, -0.00946449488401413, -0.008602304384112358, -0.0077401138842105865, -0.006877923384308815, -0.0060157328844070435, -0.005153542384505272, -0.0042913518846035, -0.003429161384701729, -0.0025669708847999573, -0.0017047803848981857, -0.0008425898849964142, 1.960061490535736e-05, 0.0008817911148071289, 0.0017439816147089005, 0.002606172114610672, 0.0034683626145124435, 0.004330553114414215, 0.005192743614315987, 0.006054934114217758, 0.00691712461411953, 0.007779315114021301, 0.008641505613923073, 0.009503696113824844, 0.010365886613726616, 0.011228077113628387, 0.012090267613530159, 0.01295245811343193, 0.013814648613333702, 0.014676839113235474, 0.015539029613137245, 0.016401220113039017, 0.01726341061294079, 0.01812560111284256, 0.01898779161274433, 0.019849982112646103, 0.020712172612547874, 0.021574363112449646, 0.022436553612351418, 0.02329874411225319, 0.02416093461215496, 0.025023125112056732, 0.025885315611958504, 0.026747506111860275, 0.027609696611762047, 0.02847188711166382]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 7.0, 10.0, 16.0, 28.0, 25.0, 54.0, 70.0, 90.0, 127.0, 170.0, 230.0, 341.0, 472.0, 662.0, 987.0, 1485.0, 2159.0, 3598.0, 6139.0, 11468.0, 27766.0, 595521.0, 345126.0, 25275.0, 10935.0, 5704.0, 3445.0, 2154.0, 1345.0, 932.0, 599.0, 453.0, 336.0, 194.0, 182.0, 120.0, 82.0, 64.0, 40.0, 36.0, 22.0, 20.0, 10.0, 9.0, 10.0, 4.0, 3.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.034210205078125, -0.033139705657958984, -0.03206920623779297, -0.030998706817626953, -0.029928207397460938, -0.028857707977294922, -0.027787208557128906, -0.02671670913696289, -0.025646209716796875, -0.02457571029663086, -0.023505210876464844, -0.022434711456298828, -0.021364212036132812, -0.020293712615966797, -0.01922321319580078, -0.018152713775634766, -0.01708221435546875, -0.016011714935302734, -0.014941215515136719, -0.013870716094970703, -0.012800216674804688, -0.011729717254638672, -0.010659217834472656, -0.00958871841430664, -0.008518218994140625, -0.007447719573974609, -0.006377220153808594, -0.005306720733642578, -0.0042362213134765625, -0.003165721893310547, -0.0020952224731445312, -0.0010247230529785156, 4.57763671875e-05, 0.0011162757873535156, 0.0021867752075195312, 0.003257274627685547, 0.0043277740478515625, 0.005398273468017578, 0.006468772888183594, 0.007539272308349609, 0.008609771728515625, 0.00968027114868164, 0.010750770568847656, 0.011821269989013672, 0.012891769409179688, 0.013962268829345703, 0.015032768249511719, 0.016103267669677734, 0.01717376708984375, 0.018244266510009766, 0.01931476593017578, 0.020385265350341797, 0.021455764770507812, 0.022526264190673828, 0.023596763610839844, 0.02466726303100586, 0.025737762451171875, 0.02680826187133789, 0.027878761291503906, 0.028949260711669922, 0.030019760131835938, 0.031090259552001953, 0.03216075897216797, 0.033231258392333984, 0.0343017578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 2.0, 11.0, 9.0, 15.0, 69.0, 235.0, 351.0, 142.0, 40.0, 19.0, 9.0, 8.0, 7.0, 6.0, 7.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004428863525390625, -0.004282653331756592, -0.004136443138122559, -0.003990232944488525, -0.003844022750854492, -0.003697812557220459, -0.0035516023635864258, -0.0034053921699523926, -0.0032591819763183594, -0.003112971782684326, -0.002966761589050293, -0.0028205513954162598, -0.0026743412017822266, -0.0025281310081481934, -0.00238192081451416, -0.002235710620880127, -0.0020895004272460938, -0.0019432902336120605, -0.0017970800399780273, -0.0016508698463439941, -0.001504659652709961, -0.0013584494590759277, -0.0012122392654418945, -0.0010660290718078613, -0.0009198188781738281, -0.0007736086845397949, -0.0006273984909057617, -0.0004811882972717285, -0.0003349781036376953, -0.0001887679100036621, -4.2557716369628906e-05, 0.0001036524772644043, 0.0002498626708984375, 0.0003960728645324707, 0.0005422830581665039, 0.0006884932518005371, 0.0008347034454345703, 0.0009809136390686035, 0.0011271238327026367, 0.00127333402633667, 0.0014195442199707031, 0.0015657544136047363, 0.0017119646072387695, 0.0018581748008728027, 0.002004384994506836, 0.002150595188140869, 0.0022968053817749023, 0.0024430155754089355, 0.0025892257690429688, 0.002735435962677002, 0.002881646156311035, 0.0030278563499450684, 0.0031740665435791016, 0.0033202767372131348, 0.003466486930847168, 0.003612697124481201, 0.0037589073181152344, 0.0039051175117492676, 0.004051327705383301, 0.004197537899017334, 0.004343748092651367, 0.0044899582862854, 0.004636168479919434, 0.004782378673553467, 0.0049285888671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 11.0, 8.0, 26.0, 30.0, 30.0, 41.0, 71.0, 70.0, 126.0, 197.0, 401.0, 700.0, 1285.0, 3241.0, 10739.0, 166868.0, 831751.0, 24042.0, 4869.0, 1971.0, 823.0, 463.0, 267.0, 140.0, 126.0, 74.0, 50.0, 37.0, 22.0, 11.0, 12.0, 14.0, 8.0, 2.0, 5.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0908203125, -0.0882406234741211, -0.08566093444824219, -0.08308124542236328, -0.08050155639648438, -0.07792186737060547, -0.07534217834472656, -0.07276248931884766, -0.07018280029296875, -0.06760311126708984, -0.06502342224121094, -0.06244373321533203, -0.059864044189453125, -0.05728435516357422, -0.05470466613769531, -0.052124977111816406, -0.0495452880859375, -0.046965599060058594, -0.04438591003417969, -0.04180622100830078, -0.039226531982421875, -0.03664684295654297, -0.03406715393066406, -0.031487464904785156, -0.02890777587890625, -0.026328086853027344, -0.023748397827148438, -0.02116870880126953, -0.018589019775390625, -0.01600933074951172, -0.013429641723632812, -0.010849952697753906, -0.008270263671875, -0.005690574645996094, -0.0031108856201171875, -0.0005311965942382812, 0.002048492431640625, 0.004628181457519531, 0.0072078704833984375, 0.009787559509277344, 0.01236724853515625, 0.014946937561035156, 0.017526626586914062, 0.02010631561279297, 0.022686004638671875, 0.02526569366455078, 0.027845382690429688, 0.030425071716308594, 0.0330047607421875, 0.035584449768066406, 0.03816413879394531, 0.04074382781982422, 0.043323516845703125, 0.04590320587158203, 0.04848289489746094, 0.051062583923339844, 0.05364227294921875, 0.056221961975097656, 0.05880165100097656, 0.06138134002685547, 0.06396102905273438, 0.06654071807861328, 0.06912040710449219, 0.0717000961303711, 0.07427978515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 17.0, 10.0, 15.0, 14.0, 14.0, 15.0, 30.0, 28.0, 29.0, 19.0, 31.0, 38.0, 34.0, 31.0, 43.0, 53.0, 38.0, 35.0, 43.0, 38.0, 41.0, 34.0, 31.0, 23.0, 30.0, 24.0, 29.0, 26.0, 22.0, 17.0, 31.0, 16.0, 24.0, 6.0, 9.0, 10.0, 8.0, 6.0, 7.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.016912221908569336, -0.016307353973388672, -0.015702486038208008, -0.015097618103027344, -0.01449275016784668, -0.013887882232666016, -0.013283014297485352, -0.012678146362304688, -0.012073278427124023, -0.01146841049194336, -0.010863542556762695, -0.010258674621582031, -0.009653806686401367, -0.009048938751220703, -0.008444070816040039, -0.007839202880859375, -0.007234334945678711, -0.006629467010498047, -0.006024599075317383, -0.005419731140136719, -0.004814863204956055, -0.004209995269775391, -0.0036051273345947266, -0.0030002593994140625, -0.0023953914642333984, -0.0017905235290527344, -0.0011856555938720703, -0.0005807876586914062, 2.4080276489257812e-05, 0.0006289482116699219, 0.001233816146850586, 0.00183868408203125, 0.002443552017211914, 0.003048419952392578, 0.003653287887573242, 0.004258155822753906, 0.00486302375793457, 0.005467891693115234, 0.0060727596282958984, 0.0066776275634765625, 0.0072824954986572266, 0.00788736343383789, 0.008492231369018555, 0.009097099304199219, 0.009701967239379883, 0.010306835174560547, 0.010911703109741211, 0.011516571044921875, 0.012121438980102539, 0.012726306915283203, 0.013331174850463867, 0.013936042785644531, 0.014540910720825195, 0.01514577865600586, 0.015750646591186523, 0.016355514526367188, 0.01696038246154785, 0.017565250396728516, 0.01817011833190918, 0.018774986267089844, 0.019379854202270508, 0.019984722137451172, 0.020589590072631836, 0.0211944580078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 5.0, 13.0, 18.0, 26.0, 24.0, 65.0, 120.0, 251.0, 668.0, 2246.0, 17242.0, 988102.0, 35251.0, 3105.0, 792.0, 289.0, 141.0, 87.0, 36.0, 26.0, 16.0, 18.0, 5.0, 2.0, 1.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07763671875, -0.07557201385498047, -0.07350730895996094, -0.0714426040649414, -0.06937789916992188, -0.06731319427490234, -0.06524848937988281, -0.06318378448486328, -0.06111907958984375, -0.05905437469482422, -0.05698966979980469, -0.054924964904785156, -0.052860260009765625, -0.050795555114746094, -0.04873085021972656, -0.04666614532470703, -0.0446014404296875, -0.04253673553466797, -0.04047203063964844, -0.038407325744628906, -0.036342620849609375, -0.034277915954589844, -0.03221321105957031, -0.03014850616455078, -0.02808380126953125, -0.02601909637451172, -0.023954391479492188, -0.021889686584472656, -0.019824981689453125, -0.017760276794433594, -0.015695571899414062, -0.013630867004394531, -0.011566162109375, -0.009501457214355469, -0.0074367523193359375, -0.005372047424316406, -0.003307342529296875, -0.0012426376342773438, 0.0008220672607421875, 0.0028867721557617188, 0.00495147705078125, 0.007016181945800781, 0.009080886840820312, 0.011145591735839844, 0.013210296630859375, 0.015275001525878906, 0.017339706420898438, 0.01940441131591797, 0.0214691162109375, 0.02353382110595703, 0.025598526000976562, 0.027663230895996094, 0.029727935791015625, 0.031792640686035156, 0.03385734558105469, 0.03592205047607422, 0.03798675537109375, 0.04005146026611328, 0.04211616516113281, 0.044180870056152344, 0.046245574951171875, 0.048310279846191406, 0.05037498474121094, 0.05243968963623047, 0.05450439453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 9.0, 9.0, 8.0, 9.0, 26.0, 31.0, 29.0, 29.0, 49.0, 64.0, 85.0, 91.0, 114.0, 88.0, 91.0, 41.0, 46.0, 37.0, 26.0, 20.0, 12.0, 6.0, 8.0, 6.0, 8.0, 10.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002155303955078125, -0.0020920783281326294, -0.002028852701187134, -0.001965627074241638, -0.0019024014472961426, -0.001839175820350647, -0.0017759501934051514, -0.0017127245664596558, -0.0016494989395141602, -0.0015862733125686646, -0.001523047685623169, -0.0014598220586776733, -0.0013965964317321777, -0.0013333708047866821, -0.0012701451778411865, -0.001206919550895691, -0.0011436939239501953, -0.0010804682970046997, -0.001017242670059204, -0.0009540170431137085, -0.0008907914161682129, -0.0008275657892227173, -0.0007643401622772217, -0.0007011145353317261, -0.0006378889083862305, -0.0005746632814407349, -0.0005114376544952393, -0.00044821202754974365, -0.00038498640060424805, -0.00032176077365875244, -0.00025853514671325684, -0.00019530951976776123, -0.00013208389282226562, -6.885826587677002e-05, -5.632638931274414e-06, 5.759298801422119e-05, 0.0001208186149597168, 0.0001840442419052124, 0.000247269868850708, 0.0003104954957962036, 0.0003737211227416992, 0.0004369467496871948, 0.0005001723766326904, 0.000563398003578186, 0.0006266236305236816, 0.0006898492574691772, 0.0007530748844146729, 0.0008163005113601685, 0.0008795261383056641, 0.0009427517652511597, 0.0010059773921966553, 0.0010692030191421509, 0.0011324286460876465, 0.001195654273033142, 0.0012588798999786377, 0.0013221055269241333, 0.001385331153869629, 0.0014485567808151245, 0.0015117824077606201, 0.0015750080347061157, 0.0016382336616516113, 0.001701459288597107, 0.0017646849155426025, 0.0018279105424880981, 0.0018911361694335938]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 17.0, 16.0, 27.0, 41.0, 69.0, 176.0, 433.0, 1504.0, 6324.0, 51823.0, 892137.0, 84994.0, 8130.0, 1862.0, 574.0, 225.0, 98.0, 48.0, 26.0, 11.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030103683471679688, -0.028926849365234375, -0.027750015258789062, -0.02657318115234375, -0.025396347045898438, -0.024219512939453125, -0.023042678833007812, -0.0218658447265625, -0.020689010620117188, -0.019512176513671875, -0.018335342407226562, -0.01715850830078125, -0.015981674194335938, -0.014804840087890625, -0.013628005981445312, -0.012451171875, -0.011274337768554688, -0.010097503662109375, -0.008920669555664062, -0.00774383544921875, -0.0065670013427734375, -0.005390167236328125, -0.0042133331298828125, -0.0030364990234375, -0.0018596649169921875, -0.000682830810546875, 0.0004940032958984375, 0.00167083740234375, 0.0028476715087890625, 0.004024505615234375, 0.0052013397216796875, 0.006378173828125, 0.0075550079345703125, 0.008731842041015625, 0.009908676147460938, 0.01108551025390625, 0.012262344360351562, 0.013439178466796875, 0.014616012573242188, 0.0157928466796875, 0.016969680786132812, 0.018146514892578125, 0.019323348999023438, 0.02050018310546875, 0.021677017211914062, 0.022853851318359375, 0.024030685424804688, 0.02520751953125, 0.026384353637695312, 0.027561187744140625, 0.028738021850585938, 0.02991485595703125, 0.031091690063476562, 0.032268524169921875, 0.03344535827636719, 0.0346221923828125, 0.03579902648925781, 0.036975860595703125, 0.03815269470214844, 0.03932952880859375, 0.04050636291503906, 0.041683197021484375, 0.04286003112792969, 0.044036865234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 15.0, 11.0, 14.0, 15.0, 30.0, 56.0, 55.0, 66.0, 80.0, 110.0, 104.0, 84.0, 67.0, 65.0, 46.0, 37.0, 28.0, 21.0, 15.0, 14.0, 6.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01605224609375, -0.01554250717163086, -0.015032768249511719, -0.014523029327392578, -0.014013290405273438, -0.013503551483154297, -0.012993812561035156, -0.012484073638916016, -0.011974334716796875, -0.011464595794677734, -0.010954856872558594, -0.010445117950439453, -0.009935379028320312, -0.009425640106201172, -0.008915901184082031, -0.00840616226196289, -0.00789642333984375, -0.007386684417724609, -0.006876945495605469, -0.006367206573486328, -0.0058574676513671875, -0.005347728729248047, -0.004837989807128906, -0.004328250885009766, -0.003818511962890625, -0.0033087730407714844, -0.0027990341186523438, -0.002289295196533203, -0.0017795562744140625, -0.0012698173522949219, -0.0007600784301757812, -0.0002503395080566406, 0.0002593994140625, 0.0007691383361816406, 0.0012788772583007812, 0.0017886161804199219, 0.0022983551025390625, 0.002808094024658203, 0.0033178329467773438, 0.0038275718688964844, 0.004337310791015625, 0.004847049713134766, 0.005356788635253906, 0.005866527557373047, 0.0063762664794921875, 0.006886005401611328, 0.007395744323730469, 0.00790548324584961, 0.00841522216796875, 0.00892496109008789, 0.009434700012207031, 0.009944438934326172, 0.010454177856445312, 0.010963916778564453, 0.011473655700683594, 0.011983394622802734, 0.012493133544921875, 0.013002872467041016, 0.013512611389160156, 0.014022350311279297, 0.014532089233398438, 0.015041828155517578, 0.015551567077636719, 0.01606130599975586, 0.016571044921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 28.0, 229.0, 631.0, 59.0, 17.0, 14.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8714686632156372, -0.8435510993003845, -0.8156334757804871, -0.7877159118652344, -0.7597983479499817, -0.731880784034729, -0.7039631605148315, -0.6760455965995789, -0.6481280326843262, -0.6202104687690735, -0.592292845249176, -0.5643752813339233, -0.5364577174186707, -0.508540153503418, -0.4806225299835205, -0.4527049660682678, -0.42478734254837036, -0.3968697488307953, -0.3689521849155426, -0.34103459119796753, -0.31311702728271484, -0.28519943356513977, -0.2572818398475647, -0.22936426103115082, -0.20144668221473694, -0.17352910339832306, -0.14561152458190918, -0.1176939308643341, -0.08977635204792023, -0.06185877323150635, -0.033941179513931274, -0.006023600697517395, 0.02189391851425171, 0.04981150105595589, 0.07772908359766006, 0.10564666986465454, 0.13356424868106842, 0.1614818274974823, 0.18939942121505737, 0.21731700003147125, 0.24523457884788513, 0.2731521725654602, 0.3010697364807129, 0.32898733019828796, 0.35690492391586304, 0.3848224878311157, 0.4127400815486908, 0.44065767526626587, 0.46857523918151855, 0.49649283289909363, 0.5244104266166687, 0.5523279905319214, 0.5802455544471741, 0.6081631183624268, 0.6360807418823242, 0.6639983057975769, 0.6919158697128296, 0.7198334336280823, 0.7477510571479797, 0.7756686210632324, 0.8035861849784851, 0.8315037488937378, 0.8594213724136353, 0.8873389363288879, 0.9152565598487854]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 1.0, 4.0, 4.0, 4.0, 6.0, 2.0, 5.0, 10.0, 15.0, 22.0, 47.0, 79.0, 114.0, 159.0, 152.0, 138.0, 87.0, 46.0, 35.0, 23.0, 12.0, 5.0, 3.0, 4.0, 4.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4582235813140869, -0.4447319805622101, -0.43124035000801086, -0.41774874925613403, -0.4042571485042572, -0.39076554775238037, -0.37727391719818115, -0.3637823164463043, -0.3502907156944275, -0.33679911494255066, -0.32330748438835144, -0.3098158836364746, -0.2963242828845978, -0.28283268213272095, -0.26934105157852173, -0.2558494508266449, -0.24235783517360687, -0.22886621952056885, -0.21537461876869202, -0.201883003115654, -0.18839140236377716, -0.17489978671073914, -0.1614081859588623, -0.14791657030582428, -0.13442495465278625, -0.12093334645032883, -0.1074417382478714, -0.09395012259483337, -0.08045852184295654, -0.06696690618991852, -0.05347529798746109, -0.03998368978500366, -0.02649208903312683, -0.013000479899346828, 0.0004911292344331741, 0.013982739299535751, 0.02747434750199318, 0.040965959429740906, 0.054457567632198334, 0.06794917583465576, 0.08144078403711319, 0.09493239223957062, 0.10842400044202805, 0.12191560864448547, 0.1354072242975235, 0.14889883995056152, 0.16239044070243835, 0.17588204145431519, 0.1893736571073532, 0.20286527276039124, 0.21635687351226807, 0.2298484891653061, 0.24334008991718292, 0.25683170557022095, 0.2703233063220978, 0.2838149070739746, 0.29730653762817383, 0.31079813838005066, 0.3242897689342499, 0.3377813696861267, 0.35127297043800354, 0.36476457118988037, 0.3782562017440796, 0.3917478024959564, 0.40523940324783325]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 8.0, 11.0, 16.0, 11.0, 24.0, 26.0, 43.0, 108.0, 729.0, 23959.0, 4166997.0, 2032.0, 108.0, 57.0, 37.0, 21.0, 17.0, 15.0, 10.0, 9.0, 5.0, 3.0, 6.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.109375, -2.0543060302734375, -1.999237060546875, -1.9441680908203125, -1.88909912109375, -1.8340301513671875, -1.778961181640625, -1.7238922119140625, -1.6688232421875, -1.6137542724609375, -1.558685302734375, -1.5036163330078125, -1.44854736328125, -1.3934783935546875, -1.338409423828125, -1.2833404541015625, -1.228271484375, -1.1732025146484375, -1.118133544921875, -1.0630645751953125, -1.00799560546875, -0.9529266357421875, -0.897857666015625, -0.8427886962890625, -0.7877197265625, -0.7326507568359375, -0.677581787109375, -0.6225128173828125, -0.56744384765625, -0.5123748779296875, -0.457305908203125, -0.4022369384765625, -0.34716796875, -0.2920989990234375, -0.237030029296875, -0.1819610595703125, -0.12689208984375, -0.0718231201171875, -0.016754150390625, 0.0383148193359375, 0.0933837890625, 0.1484527587890625, 0.203521728515625, 0.2585906982421875, 0.31365966796875, 0.3687286376953125, 0.423797607421875, 0.4788665771484375, 0.533935546875, 0.5890045166015625, 0.644073486328125, 0.6991424560546875, 0.75421142578125, 0.8092803955078125, 0.864349365234375, 0.9194183349609375, 0.9744873046875, 1.0295562744140625, 1.084625244140625, 1.1396942138671875, 1.19476318359375, 1.2498321533203125, 1.304901123046875, 1.3599700927734375, 1.4150390625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 11.0, 5.0, 8.0, 10.0, 13.0, 11.0, 27.0, 34.0, 78.0, 107.0, 158.0, 157.0, 97.0, 85.0, 59.0, 30.0, 11.0, 10.0, 11.0, 7.0, 4.0, 7.0, 9.0, 3.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003025054931640625, -0.0029384493827819824, -0.00285184383392334, -0.0027652382850646973, -0.0026786327362060547, -0.002592027187347412, -0.0025054216384887695, -0.002418816089630127, -0.0023322105407714844, -0.002245604991912842, -0.0021589994430541992, -0.0020723938941955566, -0.001985788345336914, -0.0018991827964782715, -0.001812577247619629, -0.0017259716987609863, -0.0016393661499023438, -0.0015527606010437012, -0.0014661550521850586, -0.001379549503326416, -0.0012929439544677734, -0.0012063384056091309, -0.0011197328567504883, -0.0010331273078918457, -0.0009465217590332031, -0.0008599162101745605, -0.000773310661315918, -0.0006867051124572754, -0.0006000995635986328, -0.0005134940147399902, -0.00042688846588134766, -0.0003402829170227051, -0.0002536773681640625, -0.00016707181930541992, -8.046627044677734e-05, 6.139278411865234e-06, 9.274482727050781e-05, 0.0001793503761291504, 0.00026595592498779297, 0.00035256147384643555, 0.0004391670227050781, 0.0005257725715637207, 0.0006123781204223633, 0.0006989836692810059, 0.0007855892181396484, 0.000872194766998291, 0.0009588003158569336, 0.0010454058647155762, 0.0011320114135742188, 0.0012186169624328613, 0.001305222511291504, 0.0013918280601501465, 0.001478433609008789, 0.0015650391578674316, 0.0016516447067260742, 0.0017382502555847168, 0.0018248558044433594, 0.001911461353302002, 0.0019980669021606445, 0.002084672451019287, 0.0021712779998779297, 0.0022578835487365723, 0.002344489097595215, 0.0024310946464538574, 0.0025177001953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 6.0, 10.0, 7.0, 10.0, 13.0, 25.0, 23.0, 29.0, 39.0, 49.0, 64.0, 76.0, 96.0, 142.0, 220.0, 1362.0, 4033475.0, 157222.0, 643.0, 178.0, 141.0, 100.0, 89.0, 49.0, 56.0, 24.0, 34.0, 24.0, 15.0, 24.0, 6.0, 5.0, 3.0, 11.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.2595024108886719, -0.24947357177734375, -0.23944473266601562, -0.2294158935546875, -0.21938705444335938, -0.20935821533203125, -0.19932937622070312, -0.189300537109375, -0.17927169799804688, -0.16924285888671875, -0.15921401977539062, -0.1491851806640625, -0.13915634155273438, -0.12912750244140625, -0.11909866333007812, -0.10906982421875, -0.09904098510742188, -0.08901214599609375, -0.07898330688476562, -0.0689544677734375, -0.058925628662109375, -0.04889678955078125, -0.038867950439453125, -0.028839111328125, -0.018810272216796875, -0.00878143310546875, 0.001247406005859375, 0.0112762451171875, 0.021305084228515625, 0.03133392333984375, 0.041362762451171875, 0.0513916015625, 0.061420440673828125, 0.07144927978515625, 0.08147811889648438, 0.0915069580078125, 0.10153579711914062, 0.11156463623046875, 0.12159347534179688, 0.131622314453125, 0.14165115356445312, 0.15167999267578125, 0.16170883178710938, 0.1717376708984375, 0.18176651000976562, 0.19179534912109375, 0.20182418823242188, 0.21185302734375, 0.22188186645507812, 0.23191070556640625, 0.24193954467773438, 0.2519683837890625, 0.2619972229003906, 0.27202606201171875, 0.2820549011230469, 0.292083740234375, 0.3021125793457031, 0.31214141845703125, 0.3221702575683594, 0.3321990966796875, 0.3422279357910156, 0.35225677490234375, 0.3622856140136719, 0.372314453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 7.0, 7.0, 12.0, 12.0, 14.0, 15.0, 22.0, 31.0, 57.0, 77.0, 101.0, 131.0, 230.0, 325.0, 547.0, 899.0, 505.0, 287.0, 210.0, 186.0, 110.0, 78.0, 55.0, 34.0, 21.0, 26.0, 19.0, 12.0, 7.0, 7.0, 2.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004611968994140625, -0.0044699907302856445, -0.004328012466430664, -0.004186034202575684, -0.004044055938720703, -0.0039020776748657227, -0.003760099411010742, -0.0036181211471557617, -0.0034761428833007812, -0.0033341646194458008, -0.0031921863555908203, -0.00305020809173584, -0.0029082298278808594, -0.002766251564025879, -0.0026242733001708984, -0.002482295036315918, -0.0023403167724609375, -0.002198338508605957, -0.0020563602447509766, -0.001914381980895996, -0.0017724037170410156, -0.0016304254531860352, -0.0014884471893310547, -0.0013464689254760742, -0.0012044906616210938, -0.0010625123977661133, -0.0009205341339111328, -0.0007785558700561523, -0.0006365776062011719, -0.0004945993423461914, -0.00035262107849121094, -0.00021064281463623047, -6.866455078125e-05, 7.331371307373047e-05, 0.00021529197692871094, 0.0003572702407836914, 0.0004992485046386719, 0.0006412267684936523, 0.0007832050323486328, 0.0009251832962036133, 0.0010671615600585938, 0.0012091398239135742, 0.0013511180877685547, 0.0014930963516235352, 0.0016350746154785156, 0.001777052879333496, 0.0019190311431884766, 0.002061009407043457, 0.0022029876708984375, 0.002344965934753418, 0.0024869441986083984, 0.002628922462463379, 0.0027709007263183594, 0.00291287899017334, 0.0030548572540283203, 0.0031968355178833008, 0.0033388137817382812, 0.0034807920455932617, 0.003622770309448242, 0.0037647485733032227, 0.003906726837158203, 0.004048705101013184, 0.004190683364868164, 0.0043326616287231445, 0.004474639892578125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 8.0, 159.0, 810.0, 39.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04298434779047966, -0.029278934001922607, -0.015573520213365555, -0.0018681064248085022, 0.01183730736374855, 0.0255427248775959, 0.039248134940862656, 0.05295354500412941, 0.06665895879268646, 0.08036437630653381, 0.09406978636980057, 0.10777519643306732, 0.12148061394691467, 0.13518603146076202, 0.14889144897460938, 0.16259685158729553, 0.17630226910114288, 0.19000768661499023, 0.2037130892276764, 0.21741850674152374, 0.2311239242553711, 0.24482934176921844, 0.2585347592830658, 0.27224016189575195, 0.2859455943107605, 0.29965099692344666, 0.3133564293384552, 0.32706183195114136, 0.3407672643661499, 0.35447266697883606, 0.3681780695915222, 0.38188350200653076, 0.39558887481689453, 0.4092942774295807, 0.42299970984458923, 0.4367051124572754, 0.45041054487228394, 0.4641159474849701, 0.47782135009765625, 0.4915267825126648, 0.5052322149276733, 0.5189376473426819, 0.5326430201530457, 0.5463484525680542, 0.5600538849830627, 0.5737593173980713, 0.5874646902084351, 0.6011701226234436, 0.6148754954338074, 0.6285809278488159, 0.6422863006591797, 0.6559917330741882, 0.6696971654891968, 0.6834025382995605, 0.6971079707145691, 0.7108134031295776, 0.7245187759399414, 0.73822420835495, 0.7519295811653137, 0.7656350135803223, 0.7793404459953308, 0.7930458784103394, 0.8067512512207031, 0.8204566836357117, 0.8341621160507202]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 12.0, 10.0, 21.0, 33.0, 58.0, 88.0, 102.0, 122.0, 120.0, 103.0, 106.0, 79.0, 56.0, 38.0, 24.0, 11.0, 9.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02246958017349243, -0.02055458351969719, -0.018639585003256798, -0.016724586486816406, -0.014809589833021164, -0.012894592247903347, -0.01097959466278553, -0.009064597077667713, -0.007149599492549896, -0.005234601907432079, -0.0033196043223142624, -0.0014046067371964455, 0.0005103908479213715, 0.0024253884330391884, 0.004340386018157005, 0.006255383603274822, 0.00817038118839264, 0.010085378773510456, 0.012000376358628273, 0.01391537394374609, 0.015830371528863907, 0.01774536818265915, 0.01966036669909954, 0.021575365215539932, 0.023490361869335175, 0.025405358523130417, 0.02732035703957081, 0.0292353555560112, 0.031150352209806442, 0.033065348863601685, 0.034980349242687225, 0.03689534589648247, 0.03881034255027771, 0.04072533920407295, 0.042640335857868195, 0.044555336236953735, 0.04647033289074898, 0.04838532954454422, 0.05030032992362976, 0.052215326577425, 0.054130323231220245, 0.05604531988501549, 0.05796031653881073, 0.05987531691789627, 0.06179031357169151, 0.06370531022548676, 0.0656203106045723, 0.06753530353307724, 0.06945030391216278, 0.07136530429124832, 0.07328029721975327, 0.0751952975988388, 0.07711029052734375, 0.07902529090642929, 0.08094029128551483, 0.08285528421401978, 0.08477028459310532, 0.08668528497219086, 0.0886002779006958, 0.09051527827978134, 0.09243027865886688, 0.09434527158737183, 0.09626027196645737, 0.09817526489496231, 0.10009026527404785]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 4.0, 8.0, 12.0, 15.0, 23.0, 18.0, 39.0, 25.0, 39.0, 78.0, 225.0, 923.0, 5108.0, 47532.0, 956079.0, 33027.0, 4113.0, 798.0, 206.0, 80.0, 47.0, 30.0, 26.0, 15.0, 9.0, 19.0, 9.0, 10.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.08104801177978516, -0.07829475402832031, -0.07554149627685547, -0.07278823852539062, -0.07003498077392578, -0.06728172302246094, -0.0645284652709961, -0.06177520751953125, -0.059021949768066406, -0.05626869201660156, -0.05351543426513672, -0.050762176513671875, -0.04800891876220703, -0.04525566101074219, -0.042502403259277344, -0.0397491455078125, -0.036995887756347656, -0.03424263000488281, -0.03148937225341797, -0.028736114501953125, -0.02598285675048828, -0.023229598999023438, -0.020476341247558594, -0.01772308349609375, -0.014969825744628906, -0.012216567993164062, -0.009463310241699219, -0.006710052490234375, -0.003956794738769531, -0.0012035369873046875, 0.0015497207641601562, 0.004302978515625, 0.007056236267089844, 0.009809494018554688, 0.012562751770019531, 0.015316009521484375, 0.01806926727294922, 0.020822525024414062, 0.023575782775878906, 0.02632904052734375, 0.029082298278808594, 0.03183555603027344, 0.03458881378173828, 0.037342071533203125, 0.04009532928466797, 0.04284858703613281, 0.045601844787597656, 0.0483551025390625, 0.051108360290527344, 0.05386161804199219, 0.05661487579345703, 0.059368133544921875, 0.06212139129638672, 0.06487464904785156, 0.0676279067993164, 0.07038116455078125, 0.0731344223022461, 0.07588768005371094, 0.07864093780517578, 0.08139419555664062, 0.08414745330810547, 0.08690071105957031, 0.08965396881103516, 0.0924072265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 4.0, 0.0, 8.0, 9.0, 17.0, 28.0, 84.0, 253.0, 328.0, 162.0, 46.0, 24.0, 13.0, 18.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00287628173828125, -0.0026438236236572266, -0.002411365509033203, -0.0021789073944091797, -0.0019464492797851562, -0.0017139911651611328, -0.0014815330505371094, -0.001249074935913086, -0.0010166168212890625, -0.0007841587066650391, -0.0005517005920410156, -0.0003192424774169922, -8.678436279296875e-05, 0.0001456737518310547, 0.0003781318664550781, 0.0006105899810791016, 0.000843048095703125, 0.0010755062103271484, 0.0013079643249511719, 0.0015404224395751953, 0.0017728805541992188, 0.002005338668823242, 0.0022377967834472656, 0.002470254898071289, 0.0027027130126953125, 0.002935171127319336, 0.0031676292419433594, 0.003400087356567383, 0.0036325454711914062, 0.0038650035858154297, 0.004097461700439453, 0.0043299198150634766, 0.0045623779296875, 0.0047948360443115234, 0.005027294158935547, 0.00525975227355957, 0.005492210388183594, 0.005724668502807617, 0.005957126617431641, 0.006189584732055664, 0.0064220428466796875, 0.006654500961303711, 0.006886959075927734, 0.007119417190551758, 0.007351875305175781, 0.007584333419799805, 0.007816791534423828, 0.008049249649047852, 0.008281707763671875, 0.008514165878295898, 0.008746623992919922, 0.008979082107543945, 0.009211540222167969, 0.009443998336791992, 0.009676456451416016, 0.009908914566040039, 0.010141372680664062, 0.010373830795288086, 0.01060628890991211, 0.010838747024536133, 0.011071205139160156, 0.01130366325378418, 0.011536121368408203, 0.011768579483032227, 0.01200103759765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 10.0, 11.0, 16.0, 15.0, 20.0, 27.0, 31.0, 25.0, 55.0, 84.0, 384.0, 3499.0, 357317.0, 680882.0, 5350.0, 477.0, 123.0, 42.0, 23.0, 27.0, 35.0, 12.0, 17.0, 15.0, 3.0, 13.0, 8.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0821533203125, -0.07922554016113281, -0.07629776000976562, -0.07336997985839844, -0.07044219970703125, -0.06751441955566406, -0.06458663940429688, -0.06165885925292969, -0.0587310791015625, -0.05580329895019531, -0.052875518798828125, -0.04994773864746094, -0.04701995849609375, -0.04409217834472656, -0.041164398193359375, -0.03823661804199219, -0.035308837890625, -0.03238105773925781, -0.029453277587890625, -0.026525497436523438, -0.02359771728515625, -0.020669937133789062, -0.017742156982421875, -0.014814376831054688, -0.0118865966796875, -0.008958816528320312, -0.006031036376953125, -0.0031032562255859375, -0.00017547607421875, 0.0027523040771484375, 0.005680084228515625, 0.008607864379882812, 0.01153564453125, 0.014463424682617188, 0.017391204833984375, 0.020318984985351562, 0.02324676513671875, 0.026174545288085938, 0.029102325439453125, 0.03203010559082031, 0.0349578857421875, 0.03788566589355469, 0.040813446044921875, 0.04374122619628906, 0.04666900634765625, 0.04959678649902344, 0.052524566650390625, 0.05545234680175781, 0.058380126953125, 0.06130790710449219, 0.06423568725585938, 0.06716346740722656, 0.07009124755859375, 0.07301902770996094, 0.07594680786132812, 0.07887458801269531, 0.0818023681640625, 0.08473014831542969, 0.08765792846679688, 0.09058570861816406, 0.09351348876953125, 0.09644126892089844, 0.09936904907226562, 0.10229682922363281, 0.105224609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 11.0, 11.0, 14.0, 16.0, 22.0, 20.0, 22.0, 27.0, 19.0, 37.0, 36.0, 36.0, 46.0, 42.0, 40.0, 51.0, 64.0, 44.0, 42.0, 44.0, 34.0, 27.0, 26.0, 27.0, 29.0, 19.0, 28.0, 32.0, 21.0, 18.0, 10.0, 15.0, 9.0, 12.0, 4.0, 6.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01145172119140625, -0.01109921932220459, -0.01074671745300293, -0.01039421558380127, -0.01004171371459961, -0.00968921184539795, -0.009336709976196289, -0.008984208106994629, -0.008631706237792969, -0.008279204368591309, -0.007926702499389648, -0.007574200630187988, -0.007221698760986328, -0.006869196891784668, -0.006516695022583008, -0.006164193153381348, -0.0058116912841796875, -0.005459189414978027, -0.005106687545776367, -0.004754185676574707, -0.004401683807373047, -0.004049181938171387, -0.0036966800689697266, -0.0033441781997680664, -0.0029916763305664062, -0.002639174461364746, -0.002286672592163086, -0.0019341707229614258, -0.0015816688537597656, -0.0012291669845581055, -0.0008766651153564453, -0.0005241632461547852, -0.000171661376953125, 0.00018084049224853516, 0.0005333423614501953, 0.0008858442306518555, 0.0012383460998535156, 0.0015908479690551758, 0.001943349838256836, 0.002295851707458496, 0.0026483535766601562, 0.0030008554458618164, 0.0033533573150634766, 0.0037058591842651367, 0.004058361053466797, 0.004410862922668457, 0.004763364791870117, 0.005115866661071777, 0.0054683685302734375, 0.005820870399475098, 0.006173372268676758, 0.006525874137878418, 0.006878376007080078, 0.007230877876281738, 0.0075833797454833984, 0.007935881614685059, 0.008288383483886719, 0.008640885353088379, 0.008993387222290039, 0.0093458890914917, 0.00969839096069336, 0.01005089282989502, 0.01040339469909668, 0.01075589656829834, 0.0111083984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 14.0, 36.0, 89.0, 381.0, 8923.0, 1037235.0, 1554.0, 183.0, 57.0, 22.0, 11.0, 8.0, 5.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2335205078125, -0.2258167266845703, -0.21811294555664062, -0.21040916442871094, -0.20270538330078125, -0.19500160217285156, -0.18729782104492188, -0.1795940399169922, -0.1718902587890625, -0.1641864776611328, -0.15648269653320312, -0.14877891540527344, -0.14107513427734375, -0.13337135314941406, -0.12566757202148438, -0.11796379089355469, -0.110260009765625, -0.10255622863769531, -0.09485244750976562, -0.08714866638183594, -0.07944488525390625, -0.07174110412597656, -0.06403732299804688, -0.05633354187011719, -0.0486297607421875, -0.04092597961425781, -0.033222198486328125, -0.025518417358398438, -0.01781463623046875, -0.010110855102539062, -0.002407073974609375, 0.0052967071533203125, 0.01300048828125, 0.020704269409179688, 0.028408050537109375, 0.03611183166503906, 0.04381561279296875, 0.05151939392089844, 0.059223175048828125, 0.06692695617675781, 0.0746307373046875, 0.08233451843261719, 0.09003829956054688, 0.09774208068847656, 0.10544586181640625, 0.11314964294433594, 0.12085342407226562, 0.1285572052001953, 0.136260986328125, 0.1439647674560547, 0.15166854858398438, 0.15937232971191406, 0.16707611083984375, 0.17477989196777344, 0.18248367309570312, 0.1901874542236328, 0.1978912353515625, 0.2055950164794922, 0.21329879760742188, 0.22100257873535156, 0.22870635986328125, 0.23641014099121094, 0.24411392211914062, 0.2518177032470703, 0.259521484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 6.0, 16.0, 20.0, 41.0, 74.0, 361.0, 295.0, 58.0, 33.0, 14.0, 14.0, 12.0, 12.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0029010772705078125, -0.0028318464756011963, -0.00276261568069458, -0.002693384885787964, -0.0026241540908813477, -0.0025549232959747314, -0.0024856925010681152, -0.002416461706161499, -0.002347230911254883, -0.0022780001163482666, -0.0022087693214416504, -0.002139538526535034, -0.002070307731628418, -0.0020010769367218018, -0.0019318461418151855, -0.0018626153469085693, -0.0017933845520019531, -0.001724153757095337, -0.0016549229621887207, -0.0015856921672821045, -0.0015164613723754883, -0.001447230577468872, -0.0013779997825622559, -0.0013087689876556396, -0.0012395381927490234, -0.0011703073978424072, -0.001101076602935791, -0.0010318458080291748, -0.0009626150131225586, -0.0008933842182159424, -0.0008241534233093262, -0.00075492262840271, -0.0006856918334960938, -0.0006164610385894775, -0.0005472302436828613, -0.0004779994487762451, -0.0004087686538696289, -0.0003395378589630127, -0.0002703070640563965, -0.00020107626914978027, -0.00013184547424316406, -6.261467933654785e-05, 6.616115570068359e-06, 7.584691047668457e-05, 0.00014507770538330078, 0.000214308500289917, 0.0002835392951965332, 0.0003527700901031494, 0.0004220008850097656, 0.0004912316799163818, 0.000560462474822998, 0.0006296932697296143, 0.0006989240646362305, 0.0007681548595428467, 0.0008373856544494629, 0.0009066164493560791, 0.0009758472442626953, 0.0010450780391693115, 0.0011143088340759277, 0.001183539628982544, 0.0012527704238891602, 0.0013220012187957764, 0.0013912320137023926, 0.0014604628086090088, 0.001529693603515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 12.0, 11.0, 19.0, 30.0, 34.0, 55.0, 85.0, 173.0, 319.0, 714.0, 2163.0, 9456.0, 95604.0, 884027.0, 46422.0, 6376.0, 1694.0, 645.0, 259.0, 178.0, 90.0, 72.0, 30.0, 28.0, 16.0, 14.0, 3.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062225341796875, -0.06041574478149414, -0.05860614776611328, -0.05679655075073242, -0.05498695373535156, -0.0531773567199707, -0.051367759704589844, -0.049558162689208984, -0.047748565673828125, -0.045938968658447266, -0.044129371643066406, -0.04231977462768555, -0.04051017761230469, -0.03870058059692383, -0.03689098358154297, -0.03508138656616211, -0.03327178955078125, -0.03146219253540039, -0.02965259552001953, -0.027842998504638672, -0.026033401489257812, -0.024223804473876953, -0.022414207458496094, -0.020604610443115234, -0.018795013427734375, -0.016985416412353516, -0.015175819396972656, -0.013366222381591797, -0.011556625366210938, -0.009747028350830078, -0.007937431335449219, -0.006127834320068359, -0.0043182373046875, -0.0025086402893066406, -0.0006990432739257812, 0.0011105537414550781, 0.0029201507568359375, 0.004729747772216797, 0.006539344787597656, 0.008348941802978516, 0.010158538818359375, 0.011968135833740234, 0.013777732849121094, 0.015587329864501953, 0.017396926879882812, 0.019206523895263672, 0.02101612091064453, 0.02282571792602539, 0.02463531494140625, 0.02644491195678711, 0.02825450897216797, 0.030064105987548828, 0.03187370300292969, 0.03368330001831055, 0.035492897033691406, 0.037302494049072266, 0.039112091064453125, 0.040921688079833984, 0.042731285095214844, 0.0445408821105957, 0.04635047912597656, 0.04816007614135742, 0.04996967315673828, 0.05177927017211914, 0.0535888671875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 4.0, 5.0, 6.0, 13.0, 15.0, 21.0, 21.0, 41.0, 69.0, 95.0, 136.0, 153.0, 139.0, 93.0, 61.0, 38.0, 18.0, 15.0, 14.0, 13.0, 7.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01352691650390625, -0.012825369834899902, -0.012123823165893555, -0.011422276496887207, -0.01072072982788086, -0.010019183158874512, -0.009317636489868164, -0.008616089820861816, -0.007914543151855469, -0.007212996482849121, -0.0065114498138427734, -0.005809903144836426, -0.005108356475830078, -0.0044068098068237305, -0.003705263137817383, -0.003003716468811035, -0.0023021697998046875, -0.0016006231307983398, -0.0008990764617919922, -0.00019752979278564453, 0.0005040168762207031, 0.0012055635452270508, 0.0019071102142333984, 0.002608656883239746, 0.0033102035522460938, 0.004011750221252441, 0.004713296890258789, 0.005414843559265137, 0.006116390228271484, 0.006817936897277832, 0.00751948356628418, 0.008221030235290527, 0.008922576904296875, 0.009624123573303223, 0.01032567024230957, 0.011027216911315918, 0.011728763580322266, 0.012430310249328613, 0.013131856918334961, 0.013833403587341309, 0.014534950256347656, 0.015236496925354004, 0.01593804359436035, 0.0166395902633667, 0.017341136932373047, 0.018042683601379395, 0.018744230270385742, 0.01944577693939209, 0.020147323608398438, 0.020848870277404785, 0.021550416946411133, 0.02225196361541748, 0.022953510284423828, 0.023655056953430176, 0.024356603622436523, 0.02505815029144287, 0.02575969696044922, 0.026461243629455566, 0.027162790298461914, 0.02786433696746826, 0.02856588363647461, 0.029267430305480957, 0.029968976974487305, 0.030670523643493652, 0.0313720703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 10.0, 16.0, 43.0, 88.0, 184.0, 261.0, 211.0, 98.0, 31.0, 19.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19143696129322052, -0.1858953833580017, -0.1803537905216217, -0.1748121976852417, -0.1692706197500229, -0.16372904181480408, -0.15818744897842407, -0.15264585614204407, -0.14710427820682526, -0.14156270027160645, -0.13602110743522644, -0.13047951459884644, -0.12493793666362762, -0.11939635127782822, -0.11385476589202881, -0.1083131805062294, -0.10277159512042999, -0.09723000973463058, -0.09168842434883118, -0.08614683896303177, -0.08060525357723236, -0.07506366819143295, -0.06952208280563354, -0.06398049741983414, -0.05843891203403473, -0.05289732664823532, -0.04735574126243591, -0.041814155876636505, -0.0362725704908371, -0.03073098510503769, -0.02518939971923828, -0.019647814333438873, -0.01410624384880066, -0.008564658463001251, -0.0030230730772018433, 0.0025185123085975647, 0.008060097694396973, 0.01360168308019638, 0.01914326846599579, 0.024684853851795197, 0.030226439237594604, 0.03576802462339401, 0.04130961000919342, 0.04685119539499283, 0.052392780780792236, 0.057934366166591644, 0.06347595155239105, 0.06901753693819046, 0.07455912232398987, 0.08010070770978928, 0.08564229309558868, 0.09118387848138809, 0.0967254638671875, 0.10226704925298691, 0.10780863463878632, 0.11335022002458572, 0.11889180541038513, 0.12443339079618454, 0.12997497618198395, 0.13551655411720276, 0.14105814695358276, 0.14659973978996277, 0.15214131772518158, 0.1576828956604004, 0.1632244884967804]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 4.0, 16.0, 19.0, 26.0, 34.0, 55.0, 100.0, 86.0, 130.0, 131.0, 93.0, 87.0, 70.0, 36.0, 38.0, 24.0, 16.0, 7.0, 6.0, 7.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22065919637680054, -0.2150178849697113, -0.20937658846378326, -0.20373529195785522, -0.198093980550766, -0.19245266914367676, -0.18681137263774872, -0.18117007613182068, -0.17552876472473145, -0.1698874533176422, -0.16424615681171417, -0.15860486030578613, -0.1529635488986969, -0.14732223749160767, -0.14168094098567963, -0.1360396444797516, -0.13039833307266235, -0.12475702911615372, -0.11911572515964508, -0.11347442120313644, -0.10783311724662781, -0.10219181329011917, -0.09655050933361053, -0.0909092053771019, -0.08526790142059326, -0.07962659746408463, -0.07398529350757599, -0.06834398955106735, -0.06270268559455872, -0.05706138163805008, -0.05142007768154144, -0.045778773725032806, -0.04013746976852417, -0.03449616581201553, -0.028854861855506897, -0.02321355789899826, -0.017572253942489624, -0.011930949985980988, -0.006289646029472351, -0.0006483420729637146, 0.004992961883544922, 0.010634265840053558, 0.016275569796562195, 0.02191687375307083, 0.027558177709579468, 0.033199481666088104, 0.03884078562259674, 0.04448208957910538, 0.050123393535614014, 0.05576469749212265, 0.06140600144863129, 0.06704730540513992, 0.07268860936164856, 0.0783299133181572, 0.08397121727466583, 0.08961252123117447, 0.0952538251876831, 0.10089512914419174, 0.10653643310070038, 0.11217773705720901, 0.11781904101371765, 0.12346034497022629, 0.12910164892673492, 0.13474294543266296, 0.1403842568397522]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 0.0, 2.0, 6.0, 0.0, 4.0, 6.0, 6.0, 8.0, 10.0, 6.0, 4.0, 8.0, 6.0, 14.0, 8.0, 16.0, 6.0, 16.0, 23.0, 43.0, 212.0, 26896.0, 4166108.0, 612.0, 70.0, 35.0, 17.0, 26.0, 20.0, 18.0, 11.0, 13.0, 10.0, 8.0, 8.0, 10.0, 6.0, 2.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.67822265625, -0.6604537963867188, -0.6426849365234375, -0.6249160766601562, -0.607147216796875, -0.5893783569335938, -0.5716094970703125, -0.5538406372070312, -0.53607177734375, -0.5183029174804688, -0.5005340576171875, -0.48276519775390625, -0.464996337890625, -0.44722747802734375, -0.4294586181640625, -0.41168975830078125, -0.3939208984375, -0.37615203857421875, -0.3583831787109375, -0.34061431884765625, -0.322845458984375, -0.30507659912109375, -0.2873077392578125, -0.26953887939453125, -0.25177001953125, -0.23400115966796875, -0.2162322998046875, -0.19846343994140625, -0.180694580078125, -0.16292572021484375, -0.1451568603515625, -0.12738800048828125, -0.109619140625, -0.09185028076171875, -0.0740814208984375, -0.05631256103515625, -0.038543701171875, -0.02077484130859375, -0.0030059814453125, 0.01476287841796875, 0.03253173828125, 0.05030059814453125, 0.0680694580078125, 0.08583831787109375, 0.103607177734375, 0.12137603759765625, 0.1391448974609375, 0.15691375732421875, 0.1746826171875, 0.19245147705078125, 0.2102203369140625, 0.22798919677734375, 0.245758056640625, 0.26352691650390625, 0.2812957763671875, 0.29906463623046875, 0.31683349609375, 0.33460235595703125, 0.3523712158203125, 0.37014007568359375, 0.387908935546875, 0.40567779541015625, 0.4234466552734375, 0.44121551513671875, 0.458984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 11.0, 8.0, 10.0, 17.0, 25.0, 57.0, 91.0, 115.0, 142.0, 145.0, 107.0, 77.0, 61.0, 30.0, 26.0, 17.0, 18.0, 15.0, 3.0, 7.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003326416015625, -0.003219783306121826, -0.0031131505966186523, -0.0030065178871154785, -0.0028998851776123047, -0.002793252468109131, -0.002686619758605957, -0.002579987049102783, -0.0024733543395996094, -0.0023667216300964355, -0.0022600889205932617, -0.002153456211090088, -0.002046823501586914, -0.0019401907920837402, -0.0018335580825805664, -0.0017269253730773926, -0.0016202926635742188, -0.001513659954071045, -0.001407027244567871, -0.0013003945350646973, -0.0011937618255615234, -0.0010871291160583496, -0.0009804964065551758, -0.000873863697052002, -0.0007672309875488281, -0.0006605982780456543, -0.0005539655685424805, -0.00044733285903930664, -0.0003407001495361328, -0.00023406744003295898, -0.00012743473052978516, -2.0802021026611328e-05, 8.58306884765625e-05, 0.00019246339797973633, 0.00029909610748291016, 0.000405728816986084, 0.0005123615264892578, 0.0006189942359924316, 0.0007256269454956055, 0.0008322596549987793, 0.0009388923645019531, 0.001045525074005127, 0.0011521577835083008, 0.0012587904930114746, 0.0013654232025146484, 0.0014720559120178223, 0.001578688621520996, 0.00168532133102417, 0.0017919540405273438, 0.0018985867500305176, 0.0020052194595336914, 0.0021118521690368652, 0.002218484878540039, 0.002325117588043213, 0.0024317502975463867, 0.0025383830070495605, 0.0026450157165527344, 0.002751648426055908, 0.002858281135559082, 0.002964913845062256, 0.0030715465545654297, 0.0031781792640686035, 0.0032848119735717773, 0.003391444683074951, 0.003498077392578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 18.0, 9.0, 28.0, 35.0, 61.0, 80.0, 121.0, 188.0, 223.0, 570.0, 3211691.0, 979834.0, 574.0, 215.0, 147.0, 143.0, 118.0, 64.0, 52.0, 45.0, 12.0, 17.0, 7.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.208740234375, -0.19879150390625, -0.1888427734375, -0.17889404296875, -0.1689453125, -0.15899658203125, -0.1490478515625, -0.13909912109375, -0.129150390625, -0.11920166015625, -0.1092529296875, -0.09930419921875, -0.08935546875, -0.07940673828125, -0.0694580078125, -0.05950927734375, -0.049560546875, -0.03961181640625, -0.0296630859375, -0.01971435546875, -0.009765625, 0.00018310546875, 0.0101318359375, 0.02008056640625, 0.030029296875, 0.03997802734375, 0.0499267578125, 0.05987548828125, 0.06982421875, 0.07977294921875, 0.0897216796875, 0.09967041015625, 0.109619140625, 0.11956787109375, 0.1295166015625, 0.13946533203125, 0.1494140625, 0.15936279296875, 0.1693115234375, 0.17926025390625, 0.189208984375, 0.19915771484375, 0.2091064453125, 0.21905517578125, 0.22900390625, 0.23895263671875, 0.2489013671875, 0.25885009765625, 0.268798828125, 0.27874755859375, 0.2886962890625, 0.29864501953125, 0.30859375, 0.31854248046875, 0.3284912109375, 0.33843994140625, 0.348388671875, 0.35833740234375, 0.3682861328125, 0.37823486328125, 0.38818359375, 0.39813232421875, 0.4080810546875, 0.41802978515625, 0.427978515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 33.0, 125.0, 2498.0, 1295.0, 88.0, 32.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005390167236328125, -0.0044800639152526855, -0.003569960594177246, -0.0026598572731018066, -0.0017497539520263672, -0.0008396506309509277, 7.045269012451172e-05, 0.0009805560111999512, 0.0018906593322753906, 0.00280076265335083, 0.0037108659744262695, 0.004620969295501709, 0.0055310726165771484, 0.006441175937652588, 0.007351279258728027, 0.008261382579803467, 0.009171485900878906, 0.010081589221954346, 0.010991692543029785, 0.011901795864105225, 0.012811899185180664, 0.013722002506256104, 0.014632105827331543, 0.015542209148406982, 0.016452312469482422, 0.01736241579055786, 0.0182725191116333, 0.01918262243270874, 0.02009272575378418, 0.02100282907485962, 0.02191293239593506, 0.022823035717010498, 0.023733139038085938, 0.024643242359161377, 0.025553345680236816, 0.026463449001312256, 0.027373552322387695, 0.028283655643463135, 0.029193758964538574, 0.030103862285614014, 0.031013965606689453, 0.03192406892776489, 0.03283417224884033, 0.03374427556991577, 0.03465437889099121, 0.03556448221206665, 0.03647458553314209, 0.03738468885421753, 0.03829479217529297, 0.03920489549636841, 0.04011499881744385, 0.04102510213851929, 0.04193520545959473, 0.042845308780670166, 0.043755412101745605, 0.044665515422821045, 0.045575618743896484, 0.046485722064971924, 0.04739582538604736, 0.0483059287071228, 0.04921603202819824, 0.05012613534927368, 0.05103623867034912, 0.05194634199142456, 0.0528564453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 26.0, 119.0, 649.0, 176.0, 18.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5053959488868713, -0.48323574662208557, -0.4610755145549774, -0.43891531229019165, -0.4167550802230835, -0.39459487795829773, -0.37243467569351196, -0.3502744436264038, -0.32811424136161804, -0.3059540390968323, -0.2837938070297241, -0.26163360476493835, -0.2394733875989914, -0.21731317043304443, -0.19515296816825867, -0.1729927510023117, -0.15083253383636475, -0.12867231667041779, -0.10651210695505142, -0.08435189723968506, -0.0621916800737381, -0.04003146290779114, -0.01787126064300537, 0.004288956522941589, 0.02644917368888855, 0.04860938712954521, 0.07076960057020187, 0.09292981028556824, 0.1150900274515152, 0.13725024461746216, 0.15941044688224792, 0.18157066404819489, 0.20373082160949707, 0.22589103877544403, 0.248051255941391, 0.27021145820617676, 0.2923716902732849, 0.3145318925380707, 0.33669209480285645, 0.3588523268699646, 0.38101252913475037, 0.40317273139953613, 0.4253329634666443, 0.44749316573143005, 0.4696533679962158, 0.491813600063324, 0.5139738321304321, 0.5361340045928955, 0.5582942366600037, 0.5804544687271118, 0.6026146411895752, 0.6247748732566833, 0.6469351053237915, 0.6690952777862549, 0.691255509853363, 0.7134157419204712, 0.7355759143829346, 0.7577361464500427, 0.7798963189125061, 0.8020565509796143, 0.8242167830467224, 0.8463770151138306, 0.868537187576294, 0.8906974196434021, 0.9128576517105103]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 12.0, 27.0, 89.0, 165.0, 271.0, 231.0, 130.0, 59.0, 23.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22550296783447266, -0.20513667166233063, -0.1847703754901886, -0.16440406441688538, -0.14403776824474335, -0.12367147207260132, -0.10330516844987869, -0.08293886482715607, -0.06257256865501404, -0.04220626875758171, -0.021839968860149384, -0.0014736689627170563, 0.01889263093471527, 0.0392589271068573, 0.059625230729579926, 0.07999153435230255, 0.10035783052444458, 0.12072412669658661, 0.14109042286872864, 0.16145673394203186, 0.1818230301141739, 0.20218932628631592, 0.22255563735961914, 0.24292193353176117, 0.2632882297039032, 0.2836545407772064, 0.30402082204818726, 0.3243871331214905, 0.3447534441947937, 0.36511972546577454, 0.38548603653907776, 0.4058523178100586, 0.4262186288833618, 0.44658493995666504, 0.4669512212276459, 0.4873175323009491, 0.5076838135719299, 0.5280501246452332, 0.5484164357185364, 0.5687827467918396, 0.589148998260498, 0.6095153093338013, 0.6298816204071045, 0.6502478718757629, 0.6706141829490662, 0.6909804940223694, 0.7113468050956726, 0.7317131161689758, 0.752079427242279, 0.7724457383155823, 0.7928120493888855, 0.813178300857544, 0.8335446119308472, 0.8539109230041504, 0.8742772340774536, 0.8946435451507568, 0.9150098562240601, 0.9353761672973633, 0.9557424783706665, 0.976108729839325, 0.9964750409126282, 1.0168414115905762, 1.0372076034545898, 1.057573914527893, 1.0779402256011963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 6.0, 8.0, 10.0, 16.0, 19.0, 23.0, 30.0, 33.0, 39.0, 50.0, 46.0, 52.0, 57.0, 90.0, 1047111.0, 533.0, 64.0, 69.0, 55.0, 38.0, 35.0, 23.0, 28.0, 13.0, 17.0, 16.0, 10.0, 10.0, 10.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.17578125, -2.1163482666015625, -2.056915283203125, -1.9974822998046875, -1.93804931640625, -1.8786163330078125, -1.819183349609375, -1.7597503662109375, -1.7003173828125, -1.6408843994140625, -1.581451416015625, -1.5220184326171875, -1.46258544921875, -1.4031524658203125, -1.343719482421875, -1.2842864990234375, -1.224853515625, -1.1654205322265625, -1.105987548828125, -1.0465545654296875, -0.98712158203125, -0.9276885986328125, -0.868255615234375, -0.8088226318359375, -0.7493896484375, -0.6899566650390625, -0.630523681640625, -0.5710906982421875, -0.51165771484375, -0.4522247314453125, -0.392791748046875, -0.3333587646484375, -0.27392578125, -0.2144927978515625, -0.155059814453125, -0.0956268310546875, -0.03619384765625, 0.0232391357421875, 0.082672119140625, 0.1421051025390625, 0.2015380859375, 0.2609710693359375, 0.320404052734375, 0.3798370361328125, 0.43927001953125, 0.4987030029296875, 0.558135986328125, 0.6175689697265625, 0.677001953125, 0.7364349365234375, 0.795867919921875, 0.8553009033203125, 0.91473388671875, 0.9741668701171875, 1.033599853515625, 1.0930328369140625, 1.1524658203125, 1.2118988037109375, 1.271331787109375, 1.3307647705078125, 1.39019775390625, 1.4496307373046875, 1.509063720703125, 1.5684967041015625, 1.6279296875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [50.0, 766.0, 202.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00855255126953125, -0.0037001371383666992, 0.0011522769927978516, 0.006004691123962402, 0.010857105255126953, 0.015709519386291504, 0.020561933517456055, 0.025414347648620605, 0.030266761779785156, 0.03511917591094971, 0.03997159004211426, 0.04482400417327881, 0.04967641830444336, 0.05452883243560791, 0.05938124656677246, 0.06423366069793701, 0.06908607482910156, 0.07393848896026611, 0.07879090309143066, 0.08364331722259521, 0.08849573135375977, 0.09334814548492432, 0.09820055961608887, 0.10305297374725342, 0.10790538787841797, 0.11275780200958252, 0.11761021614074707, 0.12246263027191162, 0.12731504440307617, 0.13216745853424072, 0.13701987266540527, 0.14187228679656982, 0.14672470092773438, 0.15157711505889893, 0.15642952919006348, 0.16128194332122803, 0.16613435745239258, 0.17098677158355713, 0.17583918571472168, 0.18069159984588623, 0.18554401397705078, 0.19039642810821533, 0.19524884223937988, 0.20010125637054443, 0.20495367050170898, 0.20980608463287354, 0.21465849876403809, 0.21951091289520264, 0.2243633270263672, 0.22921574115753174, 0.2340681552886963, 0.23892056941986084, 0.2437729835510254, 0.24862539768218994, 0.2534778118133545, 0.25833022594451904, 0.2631826400756836, 0.26803505420684814, 0.2728874683380127, 0.27773988246917725, 0.2825922966003418, 0.28744471073150635, 0.2922971248626709, 0.29714953899383545, 0.302001953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 14.0, 10.0, 18.0, 23.0, 35.0, 55.0, 76.0, 139.0, 198.0, 323.0, 597.0, 1113.0, 2408.0, 5776.0, 17418.0, 65934.0, 572492.0, 310921.0, 48234.0, 13458.0, 4809.0, 2074.0, 1026.0, 559.0, 280.0, 176.0, 99.0, 80.0, 61.0, 41.0, 24.0, 20.0, 15.0, 11.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.323974609375, -0.31412506103515625, -0.3042755126953125, -0.29442596435546875, -0.284576416015625, -0.27472686767578125, -0.2648773193359375, -0.25502777099609375, -0.24517822265625, -0.23532867431640625, -0.2254791259765625, -0.21562957763671875, -0.205780029296875, -0.19593048095703125, -0.1860809326171875, -0.17623138427734375, -0.1663818359375, -0.15653228759765625, -0.1466827392578125, -0.13683319091796875, -0.126983642578125, -0.11713409423828125, -0.1072845458984375, -0.09743499755859375, -0.08758544921875, -0.07773590087890625, -0.0678863525390625, -0.05803680419921875, -0.048187255859375, -0.03833770751953125, -0.0284881591796875, -0.01863861083984375, -0.0087890625, 0.00106048583984375, 0.0109100341796875, 0.02075958251953125, 0.030609130859375, 0.04045867919921875, 0.0503082275390625, 0.06015777587890625, 0.07000732421875, 0.07985687255859375, 0.0897064208984375, 0.09955596923828125, 0.109405517578125, 0.11925506591796875, 0.1291046142578125, 0.13895416259765625, 0.1488037109375, 0.15865325927734375, 0.1685028076171875, 0.17835235595703125, 0.188201904296875, 0.19805145263671875, 0.2079010009765625, 0.21775054931640625, 0.22760009765625, 0.23744964599609375, 0.2472991943359375, 0.25714874267578125, 0.266998291015625, 0.27684783935546875, 0.2866973876953125, 0.29654693603515625, 0.306396484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 12.0, 15.0, 15.0, 18.0, 36.0, 36.0, 29.0, 40.0, 65.0, 85.0, 69.0, 68.0, 76.0, 68.0, 56.0, 59.0, 44.0, 44.0, 40.0, 20.0, 13.0, 19.0, 8.0, 12.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.263916015625, -0.25655364990234375, -0.2491912841796875, -0.24182891845703125, -0.234466552734375, -0.22710418701171875, -0.2197418212890625, -0.21237945556640625, -0.20501708984375, -0.19765472412109375, -0.1902923583984375, -0.18292999267578125, -0.175567626953125, -0.16820526123046875, -0.1608428955078125, -0.15348052978515625, -0.1461181640625, -0.13875579833984375, -0.1313934326171875, -0.12403106689453125, -0.116668701171875, -0.10930633544921875, -0.1019439697265625, -0.09458160400390625, -0.08721923828125, -0.07985687255859375, -0.0724945068359375, -0.06513214111328125, -0.057769775390625, -0.05040740966796875, -0.0430450439453125, -0.03568267822265625, -0.0283203125, -0.02095794677734375, -0.0135955810546875, -0.00623321533203125, 0.001129150390625, 0.00849151611328125, 0.0158538818359375, 0.02321624755859375, 0.03057861328125, 0.03794097900390625, 0.0453033447265625, 0.05266571044921875, 0.060028076171875, 0.06739044189453125, 0.0747528076171875, 0.08211517333984375, 0.0894775390625, 0.09683990478515625, 0.1042022705078125, 0.11156463623046875, 0.118927001953125, 0.12628936767578125, 0.1336517333984375, 0.14101409912109375, 0.14837646484375, 0.15573883056640625, 0.1631011962890625, 0.17046356201171875, 0.177825927734375, 0.18518829345703125, 0.1925506591796875, 0.19991302490234375, 0.207275390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 9.0, 22.0, 24.0, 37.0, 52.0, 85.0, 150.0, 271.0, 475.0, 1108.0, 3399.0, 15940.0, 245110.0, 739376.0, 33891.0, 5539.0, 1521.0, 663.0, 312.0, 195.0, 101.0, 80.0, 50.0, 31.0, 24.0, 18.0, 13.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.327880859375, -0.3176918029785156, -0.30750274658203125, -0.2973136901855469, -0.2871246337890625, -0.2769355773925781, -0.26674652099609375, -0.2565574645996094, -0.246368408203125, -0.23617935180664062, -0.22599029541015625, -0.21580123901367188, -0.2056121826171875, -0.19542312622070312, -0.18523406982421875, -0.17504501342773438, -0.16485595703125, -0.15466690063476562, -0.14447784423828125, -0.13428878784179688, -0.1240997314453125, -0.11391067504882812, -0.10372161865234375, -0.09353256225585938, -0.083343505859375, -0.07315444946289062, -0.06296539306640625, -0.052776336669921875, -0.0425872802734375, -0.032398223876953125, -0.02220916748046875, -0.012020111083984375, -0.0018310546875, 0.008358001708984375, 0.01854705810546875, 0.028736114501953125, 0.0389251708984375, 0.049114227294921875, 0.05930328369140625, 0.06949234008789062, 0.079681396484375, 0.08987045288085938, 0.10005950927734375, 0.11024856567382812, 0.1204376220703125, 0.13062667846679688, 0.14081573486328125, 0.15100479125976562, 0.16119384765625, 0.17138290405273438, 0.18157196044921875, 0.19176101684570312, 0.2019500732421875, 0.21213912963867188, 0.22232818603515625, 0.23251724243164062, 0.242706298828125, 0.2528953552246094, 0.26308441162109375, 0.2732734680175781, 0.2834625244140625, 0.2936515808105469, 0.30384063720703125, 0.3140296936035156, 0.32421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 10.0, 3.0, 6.0, 5.0, 7.0, 7.0, 12.0, 18.0, 20.0, 25.0, 47.0, 66.0, 96.0, 140.0, 149.0, 93.0, 76.0, 58.0, 49.0, 20.0, 19.0, 14.0, 7.0, 8.0, 11.0, 6.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002460479736328125, -0.00023922696709632874, -0.00023240596055984497, -0.0002255849540233612, -0.00021876394748687744, -0.00021194294095039368, -0.0002051219344139099, -0.00019830092787742615, -0.00019147992134094238, -0.00018465891480445862, -0.00017783790826797485, -0.0001710169017314911, -0.00016419589519500732, -0.00015737488865852356, -0.0001505538821220398, -0.00014373287558555603, -0.00013691186904907227, -0.0001300908625125885, -0.00012326985597610474, -0.00011644884943962097, -0.00010962784290313721, -0.00010280683636665344, -9.598582983016968e-05, -8.916482329368591e-05, -8.234381675720215e-05, -7.552281022071838e-05, -6.870180368423462e-05, -6.188079714775085e-05, -5.505979061126709e-05, -4.8238784074783325e-05, -4.141777753829956e-05, -3.4596771001815796e-05, -2.777576446533203e-05, -2.0954757928848267e-05, -1.4133751392364502e-05, -7.312744855880737e-06, -4.917383193969727e-07, 6.329268217086792e-06, 1.3150274753570557e-05, 1.997128129005432e-05, 2.6792287826538086e-05, 3.361329436302185e-05, 4.0434300899505615e-05, 4.725530743598938e-05, 5.4076313972473145e-05, 6.089732050895691e-05, 6.771832704544067e-05, 7.453933358192444e-05, 8.13603401184082e-05, 8.818134665489197e-05, 9.500235319137573e-05, 0.0001018233597278595, 0.00010864436626434326, 0.00011546537280082703, 0.0001222863793373108, 0.00012910738587379456, 0.00013592839241027832, 0.00014274939894676208, 0.00014957040548324585, 0.00015639141201972961, 0.00016321241855621338, 0.00017003342509269714, 0.0001768544316291809, 0.00018367543816566467, 0.00019049644470214844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 14.0, 18.0, 39.0, 31.0, 56.0, 89.0, 146.0, 254.0, 515.0, 955.0, 2237.0, 5823.0, 22359.0, 576117.0, 410045.0, 20160.0, 5572.0, 2102.0, 929.0, 446.0, 239.0, 139.0, 73.0, 59.0, 31.0, 22.0, 19.0, 6.0, 12.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.50830078125, -0.4941673278808594, -0.48003387451171875, -0.4659004211425781, -0.4517669677734375, -0.4376335144042969, -0.42350006103515625, -0.4093666076660156, -0.395233154296875, -0.3810997009277344, -0.36696624755859375, -0.3528327941894531, -0.3386993408203125, -0.3245658874511719, -0.31043243408203125, -0.2962989807128906, -0.28216552734375, -0.2680320739746094, -0.25389862060546875, -0.23976516723632812, -0.2256317138671875, -0.21149826049804688, -0.19736480712890625, -0.18323135375976562, -0.169097900390625, -0.15496444702148438, -0.14083099365234375, -0.12669754028320312, -0.1125640869140625, -0.09843063354492188, -0.08429718017578125, -0.07016372680664062, -0.0560302734375, -0.041896820068359375, -0.02776336669921875, -0.013629913330078125, 0.0005035400390625, 0.014636993408203125, 0.02877044677734375, 0.042903900146484375, 0.057037353515625, 0.07117080688476562, 0.08530426025390625, 0.09943771362304688, 0.1135711669921875, 0.12770462036132812, 0.14183807373046875, 0.15597152709960938, 0.17010498046875, 0.18423843383789062, 0.19837188720703125, 0.21250534057617188, 0.2266387939453125, 0.24077224731445312, 0.25490570068359375, 0.2690391540527344, 0.283172607421875, 0.2973060607910156, 0.31143951416015625, 0.3255729675292969, 0.3397064208984375, 0.3538398742675781, 0.36797332763671875, 0.3821067810058594, 0.396240234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 11.0, 6.0, 12.0, 15.0, 22.0, 34.0, 71.0, 248.0, 297.0, 130.0, 50.0, 25.0, 16.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.286376953125, -0.27925682067871094, -0.2721366882324219, -0.2650165557861328, -0.25789642333984375, -0.2507762908935547, -0.24365615844726562, -0.23653602600097656, -0.2294158935546875, -0.22229576110839844, -0.21517562866210938, -0.2080554962158203, -0.20093536376953125, -0.1938152313232422, -0.18669509887695312, -0.17957496643066406, -0.172454833984375, -0.16533470153808594, -0.15821456909179688, -0.1510944366455078, -0.14397430419921875, -0.1368541717529297, -0.12973403930664062, -0.12261390686035156, -0.1154937744140625, -0.10837364196777344, -0.10125350952148438, -0.09413337707519531, -0.08701324462890625, -0.07989311218261719, -0.07277297973632812, -0.06565284729003906, -0.05853271484375, -0.05141258239746094, -0.044292449951171875, -0.03717231750488281, -0.03005218505859375, -0.022932052612304688, -0.015811920166015625, -0.008691787719726562, -0.0015716552734375, 0.0055484771728515625, 0.012668609619140625, 0.019788742065429688, 0.02690887451171875, 0.03402900695800781, 0.041149139404296875, 0.04826927185058594, 0.055389404296875, 0.06250953674316406, 0.06962966918945312, 0.07674980163574219, 0.08386993408203125, 0.09099006652832031, 0.09811019897460938, 0.10523033142089844, 0.1123504638671875, 0.11947059631347656, 0.12659072875976562, 0.1337108612060547, 0.14083099365234375, 0.1479511260986328, 0.15507125854492188, 0.16219139099121094, 0.1693115234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 19.0, 42.0, 83.0, 315.0, 418.0, 90.0, 17.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587178945541382, -2.4654762744903564, -2.343773603439331, -2.2220709323883057, -2.1003682613372803, -1.9786655902862549, -1.8569629192352295, -1.735260248184204, -1.6135575771331787, -1.4918549060821533, -1.370152235031128, -1.2484495639801025, -1.1267468929290771, -1.0050442218780518, -0.8833415508270264, -0.761638879776001, -0.6399362087249756, -0.5182335376739502, -0.3965308666229248, -0.2748281955718994, -0.15312552452087402, -0.03142285346984863, 0.09027981758117676, 0.21198248863220215, 0.33368515968322754, 0.45538783073425293, 0.5770905017852783, 0.6987931728363037, 0.8204958438873291, 0.9421985149383545, 1.0639011859893799, 1.1856038570404053, 1.3073062896728516, 1.429008960723877, 1.5507116317749023, 1.6724143028259277, 1.7941169738769531, 1.9158196449279785, 2.037522315979004, 2.1592249870300293, 2.2809276580810547, 2.40263032913208, 2.5243330001831055, 2.646035671234131, 2.7677383422851562, 2.8894410133361816, 3.011143684387207, 3.1328463554382324, 3.254549026489258, 3.376251697540283, 3.4979543685913086, 3.619657039642334, 3.7413597106933594, 3.8630623817443848, 3.98476505279541, 4.1064677238464355, 4.228170394897461, 4.349873065948486, 4.471575736999512, 4.593278408050537, 4.7149810791015625, 4.836683750152588, 4.958386421203613, 5.080089092254639, 5.201791763305664]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 13.0, 14.0, 12.0, 33.0, 30.0, 38.0, 45.0, 76.0, 83.0, 70.0, 85.0, 83.0, 71.0, 59.0, 64.0, 48.0, 44.0, 41.0, 29.0, 21.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0924594402313232, -1.035036563873291, -0.977613627910614, -0.920190691947937, -0.8627678155899048, -0.8053449392318726, -0.7479220032691956, -0.6904990673065186, -0.6330761909484863, -0.5756533145904541, -0.5182303786277771, -0.4608074724674225, -0.40338456630706787, -0.34596166014671326, -0.28853875398635864, -0.23111584782600403, -0.17369294166564941, -0.1162700355052948, -0.058847129344940186, -0.0014242231845855713, 0.05599868297576904, 0.11342158913612366, 0.17084449529647827, 0.22826740145683289, 0.2856903076171875, 0.3431132137775421, 0.40053611993789673, 0.45795902609825134, 0.515381932258606, 0.5728048086166382, 0.6302277445793152, 0.6876506805419922, 0.7450735569000244, 0.8024964332580566, 0.8599193692207336, 0.9173423051834106, 0.9747651815414429, 1.032188057899475, 1.0896110534667969, 1.147033929824829, 1.2044568061828613, 1.2618796825408936, 1.3193025588989258, 1.3767255544662476, 1.4341484308242798, 1.491571307182312, 1.5489943027496338, 1.606417179107666, 1.6638400554656982, 1.7212629318237305, 1.7786858081817627, 1.8361088037490845, 1.8935316801071167, 1.950954556465149, 2.0083775520324707, 2.065800428390503, 2.123223304748535, 2.1806461811065674, 2.2380690574645996, 2.295491933822632, 2.352914810180664, 2.4103379249572754, 2.4677608013153076, 2.52518367767334, 2.582606554031372]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 35.0, 134.0, 13743.0, 4179190.0, 596.0, 237.0, 119.0, 92.0, 60.0, 36.0, 18.0, 21.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.6778488159179688, -0.4645843505859375, -0.25131988525390625, -0.038055419921875, 0.17520904541015625, 0.3884735107421875, 0.6017379760742188, 0.81500244140625, 1.0282669067382812, 1.2415313720703125, 1.4547958374023438, 1.668060302734375, 1.8813247680664062, 2.0945892333984375, 2.3078536987304688, 2.5211181640625, 2.7343826293945312, 2.9476470947265625, 3.1609115600585938, 3.374176025390625, 3.5874404907226562, 3.8007049560546875, 4.013969421386719, 4.22723388671875, 4.440498352050781, 4.6537628173828125, 4.867027282714844, 5.080291748046875, 5.293556213378906, 5.5068206787109375, 5.720085144042969, 5.933349609375, 6.146614074707031, 6.3598785400390625, 6.573143005371094, 6.786407470703125, 6.999671936035156, 7.2129364013671875, 7.426200866699219, 7.63946533203125, 7.852729797363281, 8.065994262695312, 8.279258728027344, 8.492523193359375, 8.705787658691406, 8.919052124023438, 9.132316589355469, 9.3455810546875, 9.558845520019531, 9.772109985351562, 9.985374450683594, 10.198638916015625, 10.411903381347656, 10.625167846679688, 10.838432312011719, 11.05169677734375, 11.264961242675781, 11.478225708007812, 11.691490173339844, 11.904754638671875, 12.118019104003906, 12.331283569335938, 12.544548034667969, 12.7578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 27.0, 104.0, 298.0, 351.0, 177.0, 48.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023223876953125, -0.017798900604248047, -0.012373924255371094, -0.006948947906494141, -0.0015239715576171875, 0.0039010047912597656, 0.009325981140136719, 0.014750957489013672, 0.020175933837890625, 0.025600910186767578, 0.03102588653564453, 0.036450862884521484, 0.04187583923339844, 0.04730081558227539, 0.052725791931152344, 0.0581507682800293, 0.06357574462890625, 0.0690007209777832, 0.07442569732666016, 0.07985067367553711, 0.08527565002441406, 0.09070062637329102, 0.09612560272216797, 0.10155057907104492, 0.10697555541992188, 0.11240053176879883, 0.11782550811767578, 0.12325048446655273, 0.1286754608154297, 0.13410043716430664, 0.1395254135131836, 0.14495038986206055, 0.1503753662109375, 0.15580034255981445, 0.1612253189086914, 0.16665029525756836, 0.1720752716064453, 0.17750024795532227, 0.18292522430419922, 0.18835020065307617, 0.19377517700195312, 0.19920015335083008, 0.20462512969970703, 0.21005010604858398, 0.21547508239746094, 0.2209000587463379, 0.22632503509521484, 0.2317500114440918, 0.23717498779296875, 0.2425999641418457, 0.24802494049072266, 0.2534499168395996, 0.25887489318847656, 0.2642998695373535, 0.26972484588623047, 0.2751498222351074, 0.2805747985839844, 0.28599977493286133, 0.2914247512817383, 0.29684972763061523, 0.3022747039794922, 0.30769968032836914, 0.3131246566772461, 0.31854963302612305, 0.323974609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 13.0, 16.0, 23.0, 33.0, 58.0, 89.0, 176.0, 352.0, 813.0, 2949.0, 19311.0, 4098754.0, 66214.0, 3737.0, 1010.0, 335.0, 170.0, 92.0, 62.0, 35.0, 25.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2980499267578125, -2.238677978515625, -2.1793060302734375, -2.11993408203125, -2.0605621337890625, -2.001190185546875, -1.9418182373046875, -1.8824462890625, -1.8230743408203125, -1.763702392578125, -1.7043304443359375, -1.64495849609375, -1.5855865478515625, -1.526214599609375, -1.4668426513671875, -1.407470703125, -1.3480987548828125, -1.288726806640625, -1.2293548583984375, -1.16998291015625, -1.1106109619140625, -1.051239013671875, -0.9918670654296875, -0.9324951171875, -0.8731231689453125, -0.813751220703125, -0.7543792724609375, -0.69500732421875, -0.6356353759765625, -0.576263427734375, -0.5168914794921875, -0.45751953125, -0.3981475830078125, -0.338775634765625, -0.2794036865234375, -0.22003173828125, -0.1606597900390625, -0.101287841796875, -0.0419158935546875, 0.0174560546875, 0.0768280029296875, 0.136199951171875, 0.1955718994140625, 0.25494384765625, 0.3143157958984375, 0.373687744140625, 0.4330596923828125, 0.492431640625, 0.5518035888671875, 0.611175537109375, 0.6705474853515625, 0.72991943359375, 0.7892913818359375, 0.848663330078125, 0.9080352783203125, 0.9674072265625, 1.0267791748046875, 1.086151123046875, 1.1455230712890625, 1.20489501953125, 1.2642669677734375, 1.323638916015625, 1.3830108642578125, 1.4423828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 15.0, 8.0, 16.0, 31.0, 39.0, 81.0, 158.0, 2431.0, 1116.0, 110.0, 40.0, 15.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.39052581787109375, -0.3816375732421875, -0.37274932861328125, -0.363861083984375, -0.35497283935546875, -0.3460845947265625, -0.33719635009765625, -0.32830810546875, -0.31941986083984375, -0.3105316162109375, -0.30164337158203125, -0.292755126953125, -0.28386688232421875, -0.2749786376953125, -0.26609039306640625, -0.2572021484375, -0.24831390380859375, -0.2394256591796875, -0.23053741455078125, -0.221649169921875, -0.21276092529296875, -0.2038726806640625, -0.19498443603515625, -0.18609619140625, -0.17720794677734375, -0.1683197021484375, -0.15943145751953125, -0.150543212890625, -0.14165496826171875, -0.1327667236328125, -0.12387847900390625, -0.114990234375, -0.10610198974609375, -0.0972137451171875, -0.08832550048828125, -0.079437255859375, -0.07054901123046875, -0.0616607666015625, -0.05277252197265625, -0.04388427734375, -0.03499603271484375, -0.0261077880859375, -0.01721954345703125, -0.008331298828125, 0.00055694580078125, 0.0094451904296875, 0.01833343505859375, 0.0272216796875, 0.03610992431640625, 0.0449981689453125, 0.05388641357421875, 0.062774658203125, 0.07166290283203125, 0.0805511474609375, 0.08943939208984375, 0.09832763671875, 0.10721588134765625, 0.1161041259765625, 0.12499237060546875, 0.133880615234375, 0.14276885986328125, 0.1516571044921875, 0.16054534912109375, 0.16943359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 22.0, 33.0, 79.0, 217.0, 431.0, 146.0, 42.0, 10.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462117910385132, -2.3997251987457275, -2.3373324871063232, -2.27493953704834, -2.2125468254089355, -2.1501541137695312, -2.087761402130127, -2.0253686904907227, -1.9629758596420288, -1.9005831480026245, -1.8381903171539307, -1.7757976055145264, -1.713404893875122, -1.6510120630264282, -1.588619351387024, -1.52622652053833, -1.4638338088989258, -1.4014410972595215, -1.3390482664108276, -1.2766555547714233, -1.214262843132019, -1.1518700122833252, -1.089477300643921, -1.0270845890045166, -0.9646918773651123, -0.9022991061210632, -0.8399063944816589, -0.7775136232376099, -0.7151208519935608, -0.6527280807495117, -0.5903353691101074, -0.5279425978660583, -0.4655498266220093, -0.4031570851802826, -0.3407643139362335, -0.27837157249450684, -0.21597881615161896, -0.15358605980873108, -0.0911933183670044, -0.028800547122955322, 0.03359219431877136, 0.09598495066165924, 0.15837770700454712, 0.2207704484462738, 0.2831631898880005, 0.34555596113204956, 0.40794870257377625, 0.4703414738178253, 0.532734215259552, 0.5951269865036011, 0.6575196981430054, 0.7199124693870544, 0.7823052406311035, 0.8446979522705078, 0.9070907235145569, 0.969483494758606, 1.0318762063980103, 1.0942689180374146, 1.1566617488861084, 1.2190544605255127, 1.281447172164917, 1.3438400030136108, 1.4062327146530151, 1.468625545501709, 1.5310182571411133]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 16.0, 12.0, 23.0, 20.0, 36.0, 53.0, 70.0, 84.0, 98.0, 88.0, 88.0, 69.0, 84.0, 75.0, 48.0, 43.0, 27.0, 19.0, 13.0, 12.0, 9.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2092745304107666, -1.174912691116333, -1.1405508518218994, -1.1061891317367554, -1.0718272924423218, -1.0374654531478882, -1.0031036138534546, -0.968741774559021, -0.9343799948692322, -0.9000181555747986, -0.8656563758850098, -0.8312945365905762, -0.7969326972961426, -0.7625709176063538, -0.7282090783119202, -0.6938472986221313, -0.6594854593276978, -0.6251236200332642, -0.5907618403434753, -0.5564000010490417, -0.5220382213592529, -0.48767638206481934, -0.45331454277038574, -0.41895273327827454, -0.38459092378616333, -0.3502291142940521, -0.3158673048019409, -0.2815054655075073, -0.24714365601539612, -0.2127818465232849, -0.1784200221300125, -0.1440581977367401, -0.10969632863998413, -0.07533451169729233, -0.040972694754600525, -0.006610877811908722, 0.02775093913078308, 0.06211274862289429, 0.09647457301616669, 0.1308363974094391, 0.1651982069015503, 0.1995600163936615, 0.2339218407869339, 0.2682836651802063, 0.3026454746723175, 0.3370072841644287, 0.3713691234588623, 0.4057309329509735, 0.4400927424430847, 0.4744545519351959, 0.5088163614273071, 0.5431782007217407, 0.5775400400161743, 0.6119018197059631, 0.6462636590003967, 0.6806254386901855, 0.7149872779846191, 0.7493491172790527, 0.7837108969688416, 0.8180727362632751, 0.852434515953064, 0.8867963552474976, 0.9211581945419312, 0.9555200338363647, 0.9898818135261536]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 17.0, 12.0, 19.0, 18.0, 25.0, 35.0, 29.0, 48.0, 61.0, 129.0, 572.0, 9393.0, 933074.0, 102208.0, 2281.0, 255.0, 73.0, 53.0, 41.0, 28.0, 19.0, 25.0, 16.0, 18.0, 21.0, 11.0, 9.0, 7.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6865234375, -1.6365814208984375, -1.586639404296875, -1.5366973876953125, -1.48675537109375, -1.4368133544921875, -1.386871337890625, -1.3369293212890625, -1.2869873046875, -1.2370452880859375, -1.187103271484375, -1.1371612548828125, -1.08721923828125, -1.0372772216796875, -0.987335205078125, -0.9373931884765625, -0.887451171875, -0.8375091552734375, -0.787567138671875, -0.7376251220703125, -0.68768310546875, -0.6377410888671875, -0.587799072265625, -0.5378570556640625, -0.4879150390625, -0.4379730224609375, -0.388031005859375, -0.3380889892578125, -0.28814697265625, -0.2382049560546875, -0.188262939453125, -0.1383209228515625, -0.08837890625, -0.0384368896484375, 0.011505126953125, 0.0614471435546875, 0.11138916015625, 0.1613311767578125, 0.211273193359375, 0.2612152099609375, 0.3111572265625, 0.3610992431640625, 0.411041259765625, 0.4609832763671875, 0.51092529296875, 0.5608673095703125, 0.610809326171875, 0.6607513427734375, 0.710693359375, 0.7606353759765625, 0.810577392578125, 0.8605194091796875, 0.91046142578125, 0.9604034423828125, 1.010345458984375, 1.0602874755859375, 1.1102294921875, 1.1601715087890625, 1.210113525390625, 1.2600555419921875, 1.30999755859375, 1.3599395751953125, 1.409881591796875, 1.4598236083984375, 1.509765625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 24.0, 69.0, 137.0, 283.0, 252.0, 156.0, 62.0, 22.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047149658203125, -0.04127836227416992, -0.035407066345214844, -0.029535770416259766, -0.023664474487304688, -0.01779317855834961, -0.011921882629394531, -0.006050586700439453, -0.000179290771484375, 0.005692005157470703, 0.011563301086425781, 0.01743459701538086, 0.023305892944335938, 0.029177188873291016, 0.035048484802246094, 0.04091978073120117, 0.04679107666015625, 0.05266237258911133, 0.058533668518066406, 0.06440496444702148, 0.07027626037597656, 0.07614755630493164, 0.08201885223388672, 0.0878901481628418, 0.09376144409179688, 0.09963274002075195, 0.10550403594970703, 0.11137533187866211, 0.11724662780761719, 0.12311792373657227, 0.12898921966552734, 0.13486051559448242, 0.1407318115234375, 0.14660310745239258, 0.15247440338134766, 0.15834569931030273, 0.1642169952392578, 0.1700882911682129, 0.17595958709716797, 0.18183088302612305, 0.18770217895507812, 0.1935734748840332, 0.19944477081298828, 0.20531606674194336, 0.21118736267089844, 0.21705865859985352, 0.2229299545288086, 0.22880125045776367, 0.23467254638671875, 0.24054384231567383, 0.2464151382446289, 0.252286434173584, 0.25815773010253906, 0.26402902603149414, 0.2699003219604492, 0.2757716178894043, 0.2816429138183594, 0.28751420974731445, 0.29338550567626953, 0.2992568016052246, 0.3051280975341797, 0.31099939346313477, 0.31687068939208984, 0.3227419853210449, 0.32861328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 5.0, 5.0, 7.0, 14.0, 19.0, 26.0, 23.0, 43.0, 54.0, 74.0, 89.0, 149.0, 205.0, 351.0, 639.0, 1297.0, 3724.0, 13764.0, 81292.0, 645779.0, 258087.0, 31476.0, 6928.0, 2154.0, 942.0, 478.0, 298.0, 158.0, 128.0, 80.0, 73.0, 55.0, 38.0, 28.0, 16.0, 16.0, 8.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2730865478515625, -0.262481689453125, -0.2518768310546875, -0.24127197265625, -0.2306671142578125, -0.220062255859375, -0.2094573974609375, -0.1988525390625, -0.1882476806640625, -0.177642822265625, -0.1670379638671875, -0.15643310546875, -0.1458282470703125, -0.135223388671875, -0.1246185302734375, -0.114013671875, -0.1034088134765625, -0.092803955078125, -0.0821990966796875, -0.07159423828125, -0.0609893798828125, -0.050384521484375, -0.0397796630859375, -0.0291748046875, -0.0185699462890625, -0.007965087890625, 0.0026397705078125, 0.01324462890625, 0.0238494873046875, 0.034454345703125, 0.0450592041015625, 0.0556640625, 0.0662689208984375, 0.076873779296875, 0.0874786376953125, 0.09808349609375, 0.1086883544921875, 0.119293212890625, 0.1298980712890625, 0.1405029296875, 0.1511077880859375, 0.161712646484375, 0.1723175048828125, 0.18292236328125, 0.1935272216796875, 0.204132080078125, 0.2147369384765625, 0.225341796875, 0.2359466552734375, 0.246551513671875, 0.2571563720703125, 0.26776123046875, 0.2783660888671875, 0.288970947265625, 0.2995758056640625, 0.3101806640625, 0.3207855224609375, 0.331390380859375, 0.3419952392578125, 0.35260009765625, 0.3632049560546875, 0.373809814453125, 0.3844146728515625, 0.39501953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 4.0, 8.0, 8.0, 17.0, 15.0, 13.0, 16.0, 19.0, 31.0, 44.0, 42.0, 35.0, 50.0, 47.0, 48.0, 59.0, 42.0, 57.0, 50.0, 57.0, 39.0, 50.0, 37.0, 37.0, 30.0, 19.0, 22.0, 17.0, 19.0, 11.0, 14.0, 7.0, 10.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14498138427734375, -0.1390838623046875, -0.13318634033203125, -0.127288818359375, -0.12139129638671875, -0.1154937744140625, -0.10959625244140625, -0.10369873046875, -0.09780120849609375, -0.0919036865234375, -0.08600616455078125, -0.080108642578125, -0.07421112060546875, -0.0683135986328125, -0.06241607666015625, -0.0565185546875, -0.05062103271484375, -0.0447235107421875, -0.03882598876953125, -0.032928466796875, -0.02703094482421875, -0.0211334228515625, -0.01523590087890625, -0.00933837890625, -0.00344085693359375, 0.0024566650390625, 0.00835418701171875, 0.014251708984375, 0.02014923095703125, 0.0260467529296875, 0.03194427490234375, 0.037841796875, 0.04373931884765625, 0.0496368408203125, 0.05553436279296875, 0.061431884765625, 0.06732940673828125, 0.0732269287109375, 0.07912445068359375, 0.08502197265625, 0.09091949462890625, 0.0968170166015625, 0.10271453857421875, 0.108612060546875, 0.11450958251953125, 0.1204071044921875, 0.12630462646484375, 0.1322021484375, 0.13809967041015625, 0.1439971923828125, 0.14989471435546875, 0.155792236328125, 0.16168975830078125, 0.1675872802734375, 0.17348480224609375, 0.17938232421875, 0.18527984619140625, 0.1911773681640625, 0.19707489013671875, 0.202972412109375, 0.20886993408203125, 0.2147674560546875, 0.22066497802734375, 0.2265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 16.0, 18.0, 46.0, 67.0, 152.0, 316.0, 976.0, 5618.0, 342589.0, 689270.0, 7577.0, 1149.0, 427.0, 170.0, 71.0, 30.0, 19.0, 16.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.4542884826660156, -0.43616485595703125, -0.4180412292480469, -0.3999176025390625, -0.3817939758300781, -0.36367034912109375, -0.3455467224121094, -0.327423095703125, -0.3092994689941406, -0.29117584228515625, -0.2730522155761719, -0.2549285888671875, -0.23680496215820312, -0.21868133544921875, -0.20055770874023438, -0.18243408203125, -0.16431045532226562, -0.14618682861328125, -0.12806320190429688, -0.1099395751953125, -0.09181594848632812, -0.07369232177734375, -0.055568695068359375, -0.037445068359375, -0.019321441650390625, -0.00119781494140625, 0.016925811767578125, 0.0350494384765625, 0.053173065185546875, 0.07129669189453125, 0.08942031860351562, 0.1075439453125, 0.12566757202148438, 0.14379119873046875, 0.16191482543945312, 0.1800384521484375, 0.19816207885742188, 0.21628570556640625, 0.23440933227539062, 0.252532958984375, 0.2706565856933594, 0.28878021240234375, 0.3069038391113281, 0.3250274658203125, 0.3431510925292969, 0.36127471923828125, 0.3793983459472656, 0.39752197265625, 0.4156455993652344, 0.43376922607421875, 0.4518928527832031, 0.4700164794921875, 0.4881401062011719, 0.5062637329101562, 0.5243873596191406, 0.542510986328125, 0.5606346130371094, 0.5787582397460938, 0.5968818664550781, 0.6150054931640625, 0.6331291198730469, 0.6512527465820312, 0.6693763732910156, 0.6875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 4.0, 5.0, 10.0, 34.0, 52.0, 118.0, 219.0, 256.0, 148.0, 84.0, 42.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0007457733154296875, -0.0007314775139093399, -0.0007171817123889923, -0.0007028859108686447, -0.0006885901093482971, -0.0006742943078279495, -0.0006599985063076019, -0.0006457027047872543, -0.0006314069032669067, -0.0006171111017465591, -0.0006028153002262115, -0.000588519498705864, -0.0005742236971855164, -0.0005599278956651688, -0.0005456320941448212, -0.0005313362926244736, -0.000517040491104126, -0.0005027446895837784, -0.0004884488880634308, -0.0004741530865430832, -0.0004598572850227356, -0.000445561483502388, -0.0004312656819820404, -0.0004169698804616928, -0.0004026740789413452, -0.0003883782774209976, -0.00037408247590065, -0.00035978667438030243, -0.00034549087285995483, -0.00033119507133960724, -0.00031689926981925964, -0.00030260346829891205, -0.00028830766677856445, -0.00027401186525821686, -0.00025971606373786926, -0.00024542026221752167, -0.00023112446069717407, -0.00021682865917682648, -0.00020253285765647888, -0.0001882370561361313, -0.0001739412546157837, -0.0001596454530954361, -0.0001453496515750885, -0.0001310538500547409, -0.00011675804853439331, -0.00010246224701404572, -8.816644549369812e-05, -7.387064397335052e-05, -5.957484245300293e-05, -4.5279040932655334e-05, -3.098323941230774e-05, -1.6687437891960144e-05, -2.391636371612549e-06, 1.1904165148735046e-05, 2.619996666908264e-05, 4.049576818943024e-05, 5.479156970977783e-05, 6.908737123012543e-05, 8.338317275047302e-05, 9.767897427082062e-05, 0.00011197477579116821, 0.0001262705773115158, 0.0001405663788318634, 0.000154862180352211, 0.0001691579818725586]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 7.0, 17.0, 12.0, 38.0, 47.0, 90.0, 168.0, 312.0, 764.0, 2403.0, 11244.0, 148976.0, 829740.0, 46140.0, 5955.0, 1493.0, 584.0, 240.0, 117.0, 65.0, 50.0, 30.0, 12.0, 16.0, 13.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.260498046875, -0.249786376953125, -0.23907470703125, -0.228363037109375, -0.2176513671875, -0.206939697265625, -0.19622802734375, -0.185516357421875, -0.1748046875, -0.164093017578125, -0.15338134765625, -0.142669677734375, -0.1319580078125, -0.121246337890625, -0.11053466796875, -0.099822998046875, -0.089111328125, -0.078399658203125, -0.06768798828125, -0.056976318359375, -0.0462646484375, -0.035552978515625, -0.02484130859375, -0.014129638671875, -0.00341796875, 0.007293701171875, 0.01800537109375, 0.028717041015625, 0.0394287109375, 0.050140380859375, 0.06085205078125, 0.071563720703125, 0.082275390625, 0.092987060546875, 0.10369873046875, 0.114410400390625, 0.1251220703125, 0.135833740234375, 0.14654541015625, 0.157257080078125, 0.16796875, 0.178680419921875, 0.18939208984375, 0.200103759765625, 0.2108154296875, 0.221527099609375, 0.23223876953125, 0.242950439453125, 0.253662109375, 0.264373779296875, 0.27508544921875, 0.285797119140625, 0.2965087890625, 0.307220458984375, 0.31793212890625, 0.328643798828125, 0.33935546875, 0.350067138671875, 0.36077880859375, 0.371490478515625, 0.3822021484375, 0.392913818359375, 0.40362548828125, 0.414337158203125, 0.425048828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 5.0, 7.0, 11.0, 9.0, 27.0, 61.0, 107.0, 142.0, 178.0, 171.0, 115.0, 62.0, 38.0, 20.0, 15.0, 6.0, 7.0, 2.0, 3.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1136474609375, -0.10819244384765625, -0.1027374267578125, -0.09728240966796875, -0.091827392578125, -0.08637237548828125, -0.0809173583984375, -0.07546234130859375, -0.07000732421875, -0.06455230712890625, -0.0590972900390625, -0.05364227294921875, -0.048187255859375, -0.04273223876953125, -0.0372772216796875, -0.03182220458984375, -0.0263671875, -0.02091217041015625, -0.0154571533203125, -0.01000213623046875, -0.004547119140625, 0.00090789794921875, 0.0063629150390625, 0.01181793212890625, 0.01727294921875, 0.02272796630859375, 0.0281829833984375, 0.03363800048828125, 0.039093017578125, 0.04454803466796875, 0.0500030517578125, 0.05545806884765625, 0.0609130859375, 0.06636810302734375, 0.0718231201171875, 0.07727813720703125, 0.082733154296875, 0.08818817138671875, 0.0936431884765625, 0.09909820556640625, 0.10455322265625, 0.11000823974609375, 0.1154632568359375, 0.12091827392578125, 0.126373291015625, 0.13182830810546875, 0.1372833251953125, 0.14273834228515625, 0.148193359375, 0.15364837646484375, 0.1591033935546875, 0.16455841064453125, 0.170013427734375, 0.17546844482421875, 0.1809234619140625, 0.18637847900390625, 0.19183349609375, 0.19728851318359375, 0.2027435302734375, 0.20819854736328125, 0.213653564453125, 0.21910858154296875, 0.2245635986328125, 0.23001861572265625, 0.2354736328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 20.0, 136.0, 645.0, 179.0, 22.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.646785736083984, -9.466341018676758, -9.285895347595215, -9.105450630187988, -8.925005912780762, -8.744560241699219, -8.564115524291992, -8.383670806884766, -8.203225135803223, -8.022780418395996, -7.842335224151611, -7.661890029907227, -7.481444835662842, -7.300999641418457, -7.1205549240112305, -6.940109729766846, -6.759665012359619, -6.579219818115234, -6.398775100708008, -6.218329906463623, -6.037884712219238, -5.857439994812012, -5.676994800567627, -5.496549606323242, -5.316104888916016, -5.135659694671631, -4.955214977264404, -4.7747697830200195, -4.594324588775635, -4.41387939453125, -4.233434677124023, -4.052989482879639, -3.872544765472412, -3.6920998096466064, -3.5116546154022217, -3.331209659576416, -3.1507644653320312, -2.9703195095062256, -2.78987455368042, -2.609429359436035, -2.4289841651916504, -2.2485392093658447, -2.06809401512146, -1.8876490592956543, -1.707203984260559, -1.5267589092254639, -1.3463139533996582, -1.165868878364563, -0.9854239225387573, -0.8049788475036621, -0.6245338320732117, -0.44408881664276123, -0.263643741607666, -0.0831986665725708, 0.09724628925323486, 0.2776913642883301, 0.4581364393234253, 0.6385815143585205, 0.819026529788971, 0.9994715452194214, 1.1799166202545166, 1.3603616952896118, 1.5408066511154175, 1.7212517261505127, 1.901696801185608]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 10.0, 13.0, 11.0, 10.0, 19.0, 24.0, 16.0, 24.0, 29.0, 38.0, 41.0, 44.0, 57.0, 48.0, 57.0, 67.0, 64.0, 54.0, 49.0, 48.0, 41.0, 46.0, 18.0, 37.0, 37.0, 18.0, 13.0, 19.0, 8.0, 12.0, 13.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5172576904296875, -1.4781373739242554, -1.4390170574188232, -1.3998967409133911, -1.360776424407959, -1.3216559886932373, -1.2825356721878052, -1.243415355682373, -1.204295039176941, -1.1651747226715088, -1.1260544061660767, -1.0869340896606445, -1.0478136539459229, -1.0086933374404907, -0.9695730209350586, -0.9304527044296265, -0.8913323879241943, -0.8522120714187622, -0.8130917549133301, -0.7739713788032532, -0.734851062297821, -0.6957307457923889, -0.656610369682312, -0.6174900531768799, -0.5783697366714478, -0.5392494201660156, -0.5001291036605835, -0.4610087275505066, -0.42188841104507446, -0.38276809453964233, -0.3436477482318878, -0.3045274019241333, -0.26540714502334595, -0.22628681361675262, -0.1871664822101593, -0.14804615080356598, -0.10892581939697266, -0.06980548799037933, -0.03068515658378601, 0.008435189723968506, 0.047555506229400635, 0.08667583763599396, 0.12579616904258728, 0.1649165004491806, 0.20403683185577393, 0.24315716326236725, 0.28227749466896057, 0.3213978409767151, 0.3605181574821472, 0.39963847398757935, 0.43875882029533386, 0.4778791666030884, 0.5169994831085205, 0.5561197996139526, 0.5952401161193848, 0.6343604922294617, 0.6734808087348938, 0.7126011252403259, 0.7517215013504028, 0.790841817855835, 0.8299621343612671, 0.8690824508666992, 0.9082027673721313, 0.9473231434822083, 0.9864434599876404]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 13.0, 30.0, 127.0, 590.0, 4489.0, 80867.0, 4069151.0, 34900.0, 2656.0, 531.0, 213.0, 131.0, 105.0, 87.0, 52.0, 56.0, 41.0, 33.0, 32.0, 25.0, 23.0, 21.0, 17.0, 15.0, 9.0, 12.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 6.0, 7.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.469970703125, -0.4247856140136719, -0.37960052490234375, -0.3344154357910156, -0.2892303466796875, -0.24404525756835938, -0.19886016845703125, -0.15367507934570312, -0.108489990234375, -0.06330490112304688, -0.01811981201171875, 0.027065277099609375, 0.0722503662109375, 0.11743545532226562, 0.16262054443359375, 0.20780563354492188, 0.25299072265625, 0.2981758117675781, 0.34336090087890625, 0.3885459899902344, 0.4337310791015625, 0.4789161682128906, 0.5241012573242188, 0.5692863464355469, 0.614471435546875, 0.6596565246582031, 0.7048416137695312, 0.7500267028808594, 0.7952117919921875, 0.8403968811035156, 0.8855819702148438, 0.9307670593261719, 0.9759521484375, 1.0211372375488281, 1.0663223266601562, 1.1115074157714844, 1.1566925048828125, 1.2018775939941406, 1.2470626831054688, 1.2922477722167969, 1.337432861328125, 1.3826179504394531, 1.4278030395507812, 1.4729881286621094, 1.5181732177734375, 1.5633583068847656, 1.6085433959960938, 1.6537284851074219, 1.69891357421875, 1.7440986633300781, 1.7892837524414062, 1.8344688415527344, 1.8796539306640625, 1.9248390197753906, 1.9700241088867188, 2.015209197998047, 2.060394287109375, 2.105579376220703, 2.1507644653320312, 2.1959495544433594, 2.2411346435546875, 2.2863197326660156, 2.3315048217773438, 2.376689910888672, 2.421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 12.0, 28.0, 75.0, 149.0, 219.0, 222.0, 178.0, 79.0, 36.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039459228515625, -0.03395223617553711, -0.02844524383544922, -0.022938251495361328, -0.017431259155273438, -0.011924266815185547, -0.006417274475097656, -0.0009102821350097656, 0.004596710205078125, 0.010103702545166016, 0.015610694885253906, 0.021117687225341797, 0.026624679565429688, 0.03213167190551758, 0.03763866424560547, 0.04314565658569336, 0.04865264892578125, 0.05415964126586914, 0.05966663360595703, 0.06517362594604492, 0.07068061828613281, 0.0761876106262207, 0.0816946029663086, 0.08720159530639648, 0.09270858764648438, 0.09821557998657227, 0.10372257232666016, 0.10922956466674805, 0.11473655700683594, 0.12024354934692383, 0.12575054168701172, 0.1312575340270996, 0.1367645263671875, 0.1422715187072754, 0.14777851104736328, 0.15328550338745117, 0.15879249572753906, 0.16429948806762695, 0.16980648040771484, 0.17531347274780273, 0.18082046508789062, 0.18632745742797852, 0.1918344497680664, 0.1973414421081543, 0.2028484344482422, 0.20835542678833008, 0.21386241912841797, 0.21936941146850586, 0.22487640380859375, 0.23038339614868164, 0.23589038848876953, 0.24139738082885742, 0.2469043731689453, 0.2524113655090332, 0.2579183578491211, 0.263425350189209, 0.2689323425292969, 0.27443933486938477, 0.27994632720947266, 0.28545331954956055, 0.29096031188964844, 0.29646730422973633, 0.3019742965698242, 0.3074812889099121, 0.31298828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 9.0, 21.0, 43.0, 60.0, 92.0, 334.0, 1901.0, 4156803.0, 32916.0, 1447.0, 320.0, 128.0, 73.0, 58.0, 25.0, 17.0, 15.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.131103515625, -2.00439453125, -1.877685546875, -1.7509765625, -1.624267578125, -1.49755859375, -1.370849609375, -1.244140625, -1.117431640625, -0.99072265625, -0.864013671875, -0.7373046875, -0.610595703125, -0.48388671875, -0.357177734375, -0.23046875, -0.103759765625, 0.02294921875, 0.149658203125, 0.2763671875, 0.403076171875, 0.52978515625, 0.656494140625, 0.783203125, 0.909912109375, 1.03662109375, 1.163330078125, 1.2900390625, 1.416748046875, 1.54345703125, 1.670166015625, 1.796875, 1.923583984375, 2.05029296875, 2.177001953125, 2.3037109375, 2.430419921875, 2.55712890625, 2.683837890625, 2.810546875, 2.937255859375, 3.06396484375, 3.190673828125, 3.3173828125, 3.444091796875, 3.57080078125, 3.697509765625, 3.82421875, 3.950927734375, 4.07763671875, 4.204345703125, 4.3310546875, 4.457763671875, 4.58447265625, 4.711181640625, 4.837890625, 4.964599609375, 5.09130859375, 5.218017578125, 5.3447265625, 5.471435546875, 5.59814453125, 5.724853515625, 5.8515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 5.0, 12.0, 27.0, 77.0, 908.0, 2894.0, 106.0, 26.0, 14.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086669921875, -0.07242202758789062, -0.05817413330078125, -0.043926239013671875, -0.0296783447265625, -0.015430450439453125, -0.00118255615234375, 0.013065338134765625, 0.027313232421875, 0.041561126708984375, 0.05580902099609375, 0.07005691528320312, 0.0843048095703125, 0.09855270385742188, 0.11280059814453125, 0.12704849243164062, 0.14129638671875, 0.15554428100585938, 0.16979217529296875, 0.18404006958007812, 0.1982879638671875, 0.21253585815429688, 0.22678375244140625, 0.24103164672851562, 0.255279541015625, 0.2695274353027344, 0.28377532958984375, 0.2980232238769531, 0.3122711181640625, 0.3265190124511719, 0.34076690673828125, 0.3550148010253906, 0.3692626953125, 0.3835105895996094, 0.39775848388671875, 0.4120063781738281, 0.4262542724609375, 0.4405021667480469, 0.45475006103515625, 0.4689979553222656, 0.483245849609375, 0.4974937438964844, 0.5117416381835938, 0.5259895324707031, 0.5402374267578125, 0.5544853210449219, 0.5687332153320312, 0.5829811096191406, 0.59722900390625, 0.6114768981933594, 0.6257247924804688, 0.6399726867675781, 0.6542205810546875, 0.6684684753417969, 0.6827163696289062, 0.6969642639160156, 0.711212158203125, 0.7254600524902344, 0.7397079467773438, 0.7539558410644531, 0.7682037353515625, 0.7824516296386719, 0.7966995239257812, 0.8109474182128906, 0.8251953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 19.0, 57.0, 356.0, 445.0, 80.0, 21.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3457646369934082, -1.2343119382858276, -1.122859239578247, -1.011406421661377, -0.8999537229537964, -0.7885010242462158, -0.6770482659339905, -0.5655955076217651, -0.45414280891418457, -0.3426900804042816, -0.23123735189437866, -0.11978462338447571, -0.008331894874572754, 0.10312080383300781, 0.21457356214523315, 0.3260263204574585, 0.43747901916503906, 0.5489317178726196, 0.660384476184845, 0.7718372344970703, 0.8832899332046509, 0.9947426319122314, 1.1061954498291016, 1.2176481485366821, 1.3291008472442627, 1.4405535459518433, 1.5520062446594238, 1.663459062576294, 1.7749117612838745, 1.886364459991455, 1.9978172779083252, 2.1092700958251953, 2.2207226753234863, 2.3321754932403564, 2.4436280727386475, 2.5550808906555176, 2.6665334701538086, 2.7779862880706787, 2.889439105987549, 3.00089168548584, 3.11234450340271, 3.22379732131958, 3.335249900817871, 3.446702718734741, 3.5581555366516113, 3.6696081161499023, 3.7810609340667725, 3.8925137519836426, 4.003966331481934, 4.115418910980225, 4.226871967315674, 4.338324546813965, 4.449777126312256, 4.561229705810547, 4.672682762145996, 4.784135341644287, 4.895587921142578, 5.007040500640869, 5.118493556976318, 5.229946136474609, 5.3413987159729, 5.452851295471191, 5.564304351806641, 5.675756931304932, 5.787209987640381]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 12.0, 30.0, 29.0, 62.0, 84.0, 117.0, 109.0, 134.0, 124.0, 104.0, 77.0, 49.0, 27.0, 11.0, 11.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.885972499847412, -1.822251796722412, -1.758531093597412, -1.6948102712631226, -1.6310895681381226, -1.5673688650131226, -1.503648042678833, -1.439927339553833, -1.376206636428833, -1.312485933303833, -1.248765230178833, -1.1850444078445435, -1.1213237047195435, -1.0576030015945435, -0.9938822388648987, -0.9301614761352539, -0.8664407730102539, -0.8027200698852539, -0.7389993071556091, -0.6752785444259644, -0.6115578413009644, -0.5478371381759644, -0.4841163754463196, -0.4203956425189972, -0.3566749095916748, -0.2929541766643524, -0.22923344373703003, -0.16551271080970764, -0.10179197788238525, -0.038071244955062866, 0.02564948797225952, 0.08937022089958191, 0.1530909538269043, 0.21681168675422668, 0.2805324196815491, 0.34425315260887146, 0.40797388553619385, 0.47169461846351624, 0.5354153513908386, 0.5991361141204834, 0.6628568172454834, 0.7265775203704834, 0.7902982831001282, 0.854019045829773, 0.917739748954773, 0.981460452079773, 1.0451812744140625, 1.1089019775390625, 1.1726226806640625, 1.2363433837890625, 1.3000640869140625, 1.363784909248352, 1.427505612373352, 1.491226315498352, 1.5549471378326416, 1.6186678409576416, 1.6823885440826416, 1.7461092472076416, 1.8098299503326416, 1.8735507726669312, 1.9372714757919312, 2.0009922981262207, 2.0647130012512207, 2.1284337043762207, 2.1921544075012207]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 9.0, 10.0, 19.0, 26.0, 40.0, 53.0, 109.0, 228.0, 632.0, 2974.0, 40951.0, 954392.0, 44687.0, 3194.0, 636.0, 249.0, 103.0, 73.0, 41.0, 36.0, 19.0, 16.0, 10.0, 7.0, 8.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.0378875732421875, -0.993743896484375, -0.9496002197265625, -0.90545654296875, -0.8613128662109375, -0.817169189453125, -0.7730255126953125, -0.7288818359375, -0.6847381591796875, -0.640594482421875, -0.5964508056640625, -0.55230712890625, -0.5081634521484375, -0.464019775390625, -0.4198760986328125, -0.375732421875, -0.3315887451171875, -0.287445068359375, -0.2433013916015625, -0.19915771484375, -0.1550140380859375, -0.110870361328125, -0.0667266845703125, -0.0225830078125, 0.0215606689453125, 0.065704345703125, 0.1098480224609375, 0.15399169921875, 0.1981353759765625, 0.242279052734375, 0.2864227294921875, 0.33056640625, 0.3747100830078125, 0.418853759765625, 0.4629974365234375, 0.50714111328125, 0.5512847900390625, 0.595428466796875, 0.6395721435546875, 0.6837158203125, 0.7278594970703125, 0.772003173828125, 0.8161468505859375, 0.86029052734375, 0.9044342041015625, 0.948577880859375, 0.9927215576171875, 1.036865234375, 1.0810089111328125, 1.125152587890625, 1.1692962646484375, 1.21343994140625, 1.2575836181640625, 1.301727294921875, 1.3458709716796875, 1.3900146484375, 1.4341583251953125, 1.478302001953125, 1.5224456787109375, 1.56658935546875, 1.6107330322265625, 1.654876708984375, 1.6990203857421875, 1.7431640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 18.0, 37.0, 65.0, 123.0, 158.0, 184.0, 175.0, 110.0, 72.0, 41.0, 13.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11322021484375, -0.10639286041259766, -0.09956550598144531, -0.09273815155029297, -0.08591079711914062, -0.07908344268798828, -0.07225608825683594, -0.0654287338256836, -0.05860137939453125, -0.051774024963378906, -0.04494667053222656, -0.03811931610107422, -0.031291961669921875, -0.02446460723876953, -0.017637252807617188, -0.010809898376464844, -0.0039825439453125, 0.0028448104858398438, 0.009672164916992188, 0.01649951934814453, 0.023326873779296875, 0.03015422821044922, 0.03698158264160156, 0.043808937072753906, 0.05063629150390625, 0.057463645935058594, 0.06429100036621094, 0.07111835479736328, 0.07794570922851562, 0.08477306365966797, 0.09160041809082031, 0.09842777252197266, 0.105255126953125, 0.11208248138427734, 0.11890983581542969, 0.12573719024658203, 0.13256454467773438, 0.13939189910888672, 0.14621925354003906, 0.1530466079711914, 0.15987396240234375, 0.1667013168334961, 0.17352867126464844, 0.18035602569580078, 0.18718338012695312, 0.19401073455810547, 0.2008380889892578, 0.20766544342041016, 0.2144927978515625, 0.22132015228271484, 0.2281475067138672, 0.23497486114501953, 0.24180221557617188, 0.24862957000732422, 0.25545692443847656, 0.2622842788696289, 0.26911163330078125, 0.2759389877319336, 0.28276634216308594, 0.2895936965942383, 0.2964210510253906, 0.30324840545654297, 0.3100757598876953, 0.31690311431884766, 0.32373046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 11.0, 14.0, 8.0, 19.0, 20.0, 28.0, 36.0, 56.0, 65.0, 95.0, 170.0, 315.0, 496.0, 968.0, 2170.0, 5623.0, 19488.0, 114126.0, 711974.0, 156845.0, 24687.0, 6451.0, 2372.0, 1061.0, 553.0, 319.0, 174.0, 114.0, 67.0, 68.0, 32.0, 28.0, 16.0, 18.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.449951171875, -0.435699462890625, -0.42144775390625, -0.407196044921875, -0.3929443359375, -0.378692626953125, -0.36444091796875, -0.350189208984375, -0.3359375, -0.321685791015625, -0.30743408203125, -0.293182373046875, -0.2789306640625, -0.264678955078125, -0.25042724609375, -0.236175537109375, -0.221923828125, -0.207672119140625, -0.19342041015625, -0.179168701171875, -0.1649169921875, -0.150665283203125, -0.13641357421875, -0.122161865234375, -0.10791015625, -0.093658447265625, -0.07940673828125, -0.065155029296875, -0.0509033203125, -0.036651611328125, -0.02239990234375, -0.008148193359375, 0.006103515625, 0.020355224609375, 0.03460693359375, 0.048858642578125, 0.0631103515625, 0.077362060546875, 0.09161376953125, 0.105865478515625, 0.1201171875, 0.134368896484375, 0.14862060546875, 0.162872314453125, 0.1771240234375, 0.191375732421875, 0.20562744140625, 0.219879150390625, 0.234130859375, 0.248382568359375, 0.26263427734375, 0.276885986328125, 0.2911376953125, 0.305389404296875, 0.31964111328125, 0.333892822265625, 0.34814453125, 0.362396240234375, 0.37664794921875, 0.390899658203125, 0.4051513671875, 0.419403076171875, 0.43365478515625, 0.447906494140625, 0.462158203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 17.0, 14.0, 20.0, 20.0, 35.0, 36.0, 40.0, 42.0, 63.0, 64.0, 64.0, 63.0, 70.0, 65.0, 69.0, 51.0, 46.0, 43.0, 38.0, 22.0, 26.0, 21.0, 18.0, 6.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.376220703125, -0.36444854736328125, -0.3526763916015625, -0.34090423583984375, -0.329132080078125, -0.31735992431640625, -0.3055877685546875, -0.29381561279296875, -0.28204345703125, -0.27027130126953125, -0.2584991455078125, -0.24672698974609375, -0.234954833984375, -0.22318267822265625, -0.2114105224609375, -0.19963836669921875, -0.1878662109375, -0.17609405517578125, -0.1643218994140625, -0.15254974365234375, -0.140777587890625, -0.12900543212890625, -0.1172332763671875, -0.10546112060546875, -0.09368896484375, -0.08191680908203125, -0.0701446533203125, -0.05837249755859375, -0.046600341796875, -0.03482818603515625, -0.0230560302734375, -0.01128387451171875, 0.00048828125, 0.01226043701171875, 0.0240325927734375, 0.03580474853515625, 0.047576904296875, 0.05934906005859375, 0.0711212158203125, 0.08289337158203125, 0.09466552734375, 0.10643768310546875, 0.1182098388671875, 0.12998199462890625, 0.141754150390625, 0.15352630615234375, 0.1652984619140625, 0.17707061767578125, 0.1888427734375, 0.20061492919921875, 0.2123870849609375, 0.22415924072265625, 0.235931396484375, 0.24770355224609375, 0.2594757080078125, 0.27124786376953125, 0.28302001953125, 0.29479217529296875, 0.3065643310546875, 0.31833648681640625, 0.330108642578125, 0.34188079833984375, 0.3536529541015625, 0.36542510986328125, 0.377197265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 17.0, 15.0, 16.0, 20.0, 34.0, 63.0, 90.0, 162.0, 234.0, 505.0, 1164.0, 3032.0, 8804.0, 35771.0, 296613.0, 597271.0, 81599.0, 15035.0, 4695.0, 1705.0, 772.0, 367.0, 198.0, 97.0, 66.0, 50.0, 41.0, 14.0, 22.0, 11.0, 10.0, 9.0, 10.0, 9.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.15033531188964844, -0.14551925659179688, -0.1407032012939453, -0.13588714599609375, -0.1310710906982422, -0.12625503540039062, -0.12143898010253906, -0.1166229248046875, -0.11180686950683594, -0.10699081420898438, -0.10217475891113281, -0.09735870361328125, -0.09254264831542969, -0.08772659301757812, -0.08291053771972656, -0.078094482421875, -0.07327842712402344, -0.06846237182617188, -0.06364631652832031, -0.05883026123046875, -0.05401420593261719, -0.049198150634765625, -0.04438209533691406, -0.0395660400390625, -0.03474998474121094, -0.029933929443359375, -0.025117874145507812, -0.02030181884765625, -0.015485763549804688, -0.010669708251953125, -0.0058536529541015625, -0.00103759765625, 0.0037784576416015625, 0.008594512939453125, 0.013410568237304688, 0.01822662353515625, 0.023042678833007812, 0.027858734130859375, 0.03267478942871094, 0.0374908447265625, 0.04230690002441406, 0.047122955322265625, 0.05193901062011719, 0.05675506591796875, 0.06157112121582031, 0.06638717651367188, 0.07120323181152344, 0.076019287109375, 0.08083534240722656, 0.08565139770507812, 0.09046745300292969, 0.09528350830078125, 0.10009956359863281, 0.10491561889648438, 0.10973167419433594, 0.1145477294921875, 0.11936378479003906, 0.12417984008789062, 0.1289958953857422, 0.13381195068359375, 0.1386280059814453, 0.14344406127929688, 0.14826011657714844, 0.153076171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 18.0, 14.0, 17.0, 26.0, 32.0, 55.0, 32.0, 51.0, 74.0, 82.0, 91.0, 105.0, 64.0, 67.0, 53.0, 43.0, 38.0, 26.0, 26.0, 19.0, 14.0, 13.0, 10.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00016570091247558594, -0.00016160588711500168, -0.00015751086175441742, -0.00015341583639383316, -0.0001493208110332489, -0.00014522578567266464, -0.00014113076031208038, -0.00013703573495149612, -0.00013294070959091187, -0.0001288456842303276, -0.00012475065886974335, -0.00012065563350915909, -0.00011656060814857483, -0.00011246558278799057, -0.00010837055742740631, -0.00010427553206682205, -0.00010018050670623779, -9.608548134565353e-05, -9.199045598506927e-05, -8.789543062448502e-05, -8.380040526390076e-05, -7.97053799033165e-05, -7.561035454273224e-05, -7.151532918214798e-05, -6.742030382156372e-05, -6.332527846097946e-05, -5.92302531003952e-05, -5.5135227739810944e-05, -5.1040202379226685e-05, -4.6945177018642426e-05, -4.2850151658058167e-05, -3.875512629747391e-05, -3.466010093688965e-05, -3.056507557630539e-05, -2.647005021572113e-05, -2.237502485513687e-05, -1.8279999494552612e-05, -1.4184974133968353e-05, -1.0089948773384094e-05, -5.994923412799835e-06, -1.8998980522155762e-06, 2.195127308368683e-06, 6.290152668952942e-06, 1.0385178029537201e-05, 1.448020339012146e-05, 1.857522875070572e-05, 2.2670254111289978e-05, 2.6765279471874237e-05, 3.0860304832458496e-05, 3.4955330193042755e-05, 3.9050355553627014e-05, 4.314538091421127e-05, 4.724040627479553e-05, 5.133543163537979e-05, 5.543045699596405e-05, 5.952548235654831e-05, 6.362050771713257e-05, 6.771553307771683e-05, 7.181055843830109e-05, 7.590558379888535e-05, 8.00006091594696e-05, 8.409563452005386e-05, 8.819065988063812e-05, 9.228568524122238e-05, 9.638071060180664e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 6.0, 3.0, 17.0, 18.0, 25.0, 34.0, 63.0, 75.0, 162.0, 313.0, 711.0, 1804.0, 5311.0, 21146.0, 230386.0, 704729.0, 67817.0, 10672.0, 3090.0, 1160.0, 458.0, 209.0, 140.0, 80.0, 47.0, 25.0, 9.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1578693389892578, -0.15228652954101562, -0.14670372009277344, -0.14112091064453125, -0.13553810119628906, -0.12995529174804688, -0.12437248229980469, -0.1187896728515625, -0.11320686340332031, -0.10762405395507812, -0.10204124450683594, -0.09645843505859375, -0.09087562561035156, -0.08529281616210938, -0.07971000671386719, -0.074127197265625, -0.06854438781738281, -0.06296157836914062, -0.05737876892089844, -0.05179595947265625, -0.04621315002441406, -0.040630340576171875, -0.03504753112792969, -0.0294647216796875, -0.023881912231445312, -0.018299102783203125, -0.012716293334960938, -0.00713348388671875, -0.0015506744384765625, 0.004032135009765625, 0.009614944458007812, 0.01519775390625, 0.020780563354492188, 0.026363372802734375, 0.03194618225097656, 0.03752899169921875, 0.04311180114746094, 0.048694610595703125, 0.05427742004394531, 0.0598602294921875, 0.06544303894042969, 0.07102584838867188, 0.07660865783691406, 0.08219146728515625, 0.08777427673339844, 0.09335708618164062, 0.09893989562988281, 0.104522705078125, 0.11010551452636719, 0.11568832397460938, 0.12127113342285156, 0.12685394287109375, 0.13243675231933594, 0.13801956176757812, 0.1436023712158203, 0.1491851806640625, 0.1547679901123047, 0.16035079956054688, 0.16593360900878906, 0.17151641845703125, 0.17709922790527344, 0.18268203735351562, 0.1882648468017578, 0.19384765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 11.0, 15.0, 29.0, 35.0, 58.0, 108.0, 138.0, 147.0, 130.0, 108.0, 80.0, 57.0, 25.0, 18.0, 12.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08619022369384766, -0.08235359191894531, -0.07851696014404297, -0.07468032836914062, -0.07084369659423828, -0.06700706481933594, -0.0631704330444336, -0.05933380126953125, -0.055497169494628906, -0.05166053771972656, -0.04782390594482422, -0.043987274169921875, -0.04015064239501953, -0.03631401062011719, -0.032477378845214844, -0.0286407470703125, -0.024804115295410156, -0.020967483520507812, -0.01713085174560547, -0.013294219970703125, -0.009457588195800781, -0.0056209564208984375, -0.0017843246459960938, 0.00205230712890625, 0.005888938903808594, 0.009725570678710938, 0.013562202453613281, 0.017398834228515625, 0.02123546600341797, 0.025072097778320312, 0.028908729553222656, 0.032745361328125, 0.036581993103027344, 0.04041862487792969, 0.04425525665283203, 0.048091888427734375, 0.05192852020263672, 0.05576515197753906, 0.059601783752441406, 0.06343841552734375, 0.0672750473022461, 0.07111167907714844, 0.07494831085205078, 0.07878494262695312, 0.08262157440185547, 0.08645820617675781, 0.09029483795166016, 0.0941314697265625, 0.09796810150146484, 0.10180473327636719, 0.10564136505126953, 0.10947799682617188, 0.11331462860107422, 0.11715126037597656, 0.1209878921508789, 0.12482452392578125, 0.1286611557006836, 0.13249778747558594, 0.13633441925048828, 0.14017105102539062, 0.14400768280029297, 0.1478443145751953, 0.15168094635009766, 0.155517578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 7.0, 25.0, 77.0, 189.0, 383.0, 218.0, 59.0, 26.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.911895275115967, -2.7886033058166504, -2.665311336517334, -2.5420193672180176, -2.4187276363372803, -2.295435667037964, -2.1721436977386475, -2.048851728439331, -1.9255597591400146, -1.8022677898406982, -1.6789759397506714, -1.555683970451355, -1.4323920011520386, -1.3091001510620117, -1.1858081817626953, -1.062516212463379, -0.939224362373352, -0.8159324526786804, -0.692640483379364, -0.5693485736846924, -0.44605663418769836, -0.32276469469070435, -0.19947278499603271, -0.07618081569671631, 0.04711109399795532, 0.17040303349494934, 0.29369497299194336, 0.416986882686615, 0.5402787923812866, 0.663570761680603, 0.7868626713752747, 0.9101546406745911, 1.0334465503692627, 1.156738519668579, 1.280030369758606, 1.4033223390579224, 1.5266143083572388, 1.6499061584472656, 1.773198127746582, 1.8964900970458984, 2.019782066345215, 2.1430740356445312, 2.2663660049438477, 2.389657974243164, 2.5129497051239014, 2.6362416744232178, 2.759533643722534, 2.8828256130218506, 3.006117343902588, 3.1294093132019043, 3.2527012825012207, 3.375993251800537, 3.4992849826812744, 3.622576951980591, 3.7458689212799072, 3.8691608905792236, 3.99245285987854, 4.115744590759277, 4.239036560058594, 4.36232852935791, 4.485620498657227, 4.608912467956543, 4.732204437255859, 4.855496406555176, 4.978788375854492]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 7.0, 8.0, 6.0, 16.0, 19.0, 17.0, 15.0, 29.0, 29.0, 35.0, 39.0, 39.0, 51.0, 43.0, 53.0, 42.0, 74.0, 54.0, 46.0, 50.0, 54.0, 40.0, 37.0, 27.0, 33.0, 30.0, 29.0, 18.0, 11.0, 10.0, 13.0, 11.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4132628440856934, -1.359816074371338, -1.3063693046569824, -1.252922534942627, -1.199475884437561, -1.1460291147232056, -1.09258234500885, -1.0391355752944946, -0.9856888055801392, -0.9322420358657837, -0.878795325756073, -0.8253485560417175, -0.7719017863273621, -0.7184550762176514, -0.6650083065032959, -0.6115615367889404, -0.5581148266792297, -0.5046680569648743, -0.4512213170528412, -0.3977745771408081, -0.34432780742645264, -0.29088106751441956, -0.23743432760238647, -0.183987557888031, -0.13054081797599792, -0.07709406316280365, -0.023647315800189972, 0.029799431562423706, 0.08324618637561798, 0.13669294118881226, 0.19013968110084534, 0.2435864508152008, 0.2970331907272339, 0.35047993063926697, 0.40392670035362244, 0.4573734402656555, 0.510820209980011, 0.5642669200897217, 0.6177136898040771, 0.6711604595184326, 0.7246072292327881, 0.7780539989471436, 0.8315007090568542, 0.8849474787712097, 0.9383942484855652, 0.9918409585952759, 1.0452877283096313, 1.0987344980239868, 1.1521811485290527, 1.2056279182434082, 1.2590746879577637, 1.3125214576721191, 1.365968108177185, 1.4194148778915405, 1.472861647605896, 1.5263084173202515, 1.579755187034607, 1.6332019567489624, 1.6866487264633179, 1.7400953769683838, 1.7935421466827393, 1.8469889163970947, 1.9004356861114502, 1.9538824558258057, 2.007329225540161]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 4.0, 19.0, 19.0, 27.0, 75.0, 146.0, 375.0, 923.0, 3046.0, 15142.0, 243294.0, 3888614.0, 34492.0, 5147.0, 1379.0, 591.0, 285.0, 181.0, 120.0, 90.0, 70.0, 41.0, 36.0, 23.0, 16.0, 24.0, 15.0, 16.0, 12.0, 12.0, 8.0, 3.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.465087890625, -0.4345054626464844, -0.40392303466796875, -0.3733406066894531, -0.3427581787109375, -0.3121757507324219, -0.28159332275390625, -0.2510108947753906, -0.220428466796875, -0.18984603881835938, -0.15926361083984375, -0.12868118286132812, -0.0980987548828125, -0.06751632690429688, -0.03693389892578125, -0.006351470947265625, 0.02423095703125, 0.054813385009765625, 0.08539581298828125, 0.11597824096679688, 0.1465606689453125, 0.17714309692382812, 0.20772552490234375, 0.23830795288085938, 0.268890380859375, 0.2994728088378906, 0.33005523681640625, 0.3606376647949219, 0.3912200927734375, 0.4218025207519531, 0.45238494873046875, 0.4829673767089844, 0.5135498046875, 0.5441322326660156, 0.5747146606445312, 0.6052970886230469, 0.6358795166015625, 0.6664619445800781, 0.6970443725585938, 0.7276268005371094, 0.758209228515625, 0.7887916564941406, 0.8193740844726562, 0.8499565124511719, 0.8805389404296875, 0.9111213684082031, 0.9417037963867188, 0.9722862243652344, 1.00286865234375, 1.0334510803222656, 1.0640335083007812, 1.0946159362792969, 1.1251983642578125, 1.1557807922363281, 1.1863632202148438, 1.2169456481933594, 1.247528076171875, 1.2781105041503906, 1.3086929321289062, 1.3392753601074219, 1.3698577880859375, 1.4004402160644531, 1.4310226440429688, 1.4616050720214844, 1.4921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 21.0, 37.0, 60.0, 125.0, 139.0, 168.0, 164.0, 128.0, 77.0, 48.0, 20.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083251953125, -0.07669448852539062, -0.07013702392578125, -0.06357955932617188, -0.0570220947265625, -0.050464630126953125, -0.04390716552734375, -0.037349700927734375, -0.030792236328125, -0.024234771728515625, -0.01767730712890625, -0.011119842529296875, -0.0045623779296875, 0.001995086669921875, 0.00855255126953125, 0.015110015869140625, 0.02166748046875, 0.028224945068359375, 0.03478240966796875, 0.041339874267578125, 0.0478973388671875, 0.054454803466796875, 0.06101226806640625, 0.06756973266601562, 0.074127197265625, 0.08068466186523438, 0.08724212646484375, 0.09379959106445312, 0.1003570556640625, 0.10691452026367188, 0.11347198486328125, 0.12002944946289062, 0.1265869140625, 0.13314437866210938, 0.13970184326171875, 0.14625930786132812, 0.1528167724609375, 0.15937423706054688, 0.16593170166015625, 0.17248916625976562, 0.179046630859375, 0.18560409545898438, 0.19216156005859375, 0.19871902465820312, 0.2052764892578125, 0.21183395385742188, 0.21839141845703125, 0.22494888305664062, 0.23150634765625, 0.23806381225585938, 0.24462127685546875, 0.2511787414550781, 0.2577362060546875, 0.2642936706542969, 0.27085113525390625, 0.2774085998535156, 0.283966064453125, 0.2905235290527344, 0.29708099365234375, 0.3036384582519531, 0.3101959228515625, 0.3167533874511719, 0.32331085205078125, 0.3298683166503906, 0.33642578125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 17.0, 28.0, 37.0, 85.0, 141.0, 307.0, 629.0, 2103.0, 19959.0, 4148945.0, 18391.0, 2170.0, 752.0, 355.0, 159.0, 89.0, 40.0, 36.0, 8.0, 11.0, 6.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4443359375, -1.395355224609375, -1.34637451171875, -1.297393798828125, -1.2484130859375, -1.199432373046875, -1.15045166015625, -1.101470947265625, -1.052490234375, -1.003509521484375, -0.95452880859375, -0.905548095703125, -0.8565673828125, -0.807586669921875, -0.75860595703125, -0.709625244140625, -0.66064453125, -0.611663818359375, -0.56268310546875, -0.513702392578125, -0.4647216796875, -0.415740966796875, -0.36676025390625, -0.317779541015625, -0.268798828125, -0.219818115234375, -0.17083740234375, -0.121856689453125, -0.0728759765625, -0.023895263671875, 0.02508544921875, 0.074066162109375, 0.123046875, 0.172027587890625, 0.22100830078125, 0.269989013671875, 0.3189697265625, 0.367950439453125, 0.41693115234375, 0.465911865234375, 0.514892578125, 0.563873291015625, 0.61285400390625, 0.661834716796875, 0.7108154296875, 0.759796142578125, 0.80877685546875, 0.857757568359375, 0.90673828125, 0.955718994140625, 1.00469970703125, 1.053680419921875, 1.1026611328125, 1.151641845703125, 1.20062255859375, 1.249603271484375, 1.298583984375, 1.347564697265625, 1.39654541015625, 1.445526123046875, 1.4945068359375, 1.543487548828125, 1.59246826171875, 1.641448974609375, 1.6904296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 8.0, 3.0, 6.0, 17.0, 54.0, 237.0, 2769.0, 794.0, 111.0, 38.0, 17.0, 11.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.220703125, -0.2121429443359375, -0.203582763671875, -0.1950225830078125, -0.18646240234375, -0.1779022216796875, -0.169342041015625, -0.1607818603515625, -0.1522216796875, -0.1436614990234375, -0.135101318359375, -0.1265411376953125, -0.11798095703125, -0.1094207763671875, -0.100860595703125, -0.0923004150390625, -0.083740234375, -0.0751800537109375, -0.066619873046875, -0.0580596923828125, -0.04949951171875, -0.0409393310546875, -0.032379150390625, -0.0238189697265625, -0.0152587890625, -0.0066986083984375, 0.001861572265625, 0.0104217529296875, 0.01898193359375, 0.0275421142578125, 0.036102294921875, 0.0446624755859375, 0.05322265625, 0.0617828369140625, 0.070343017578125, 0.0789031982421875, 0.08746337890625, 0.0960235595703125, 0.104583740234375, 0.1131439208984375, 0.1217041015625, 0.1302642822265625, 0.138824462890625, 0.1473846435546875, 0.15594482421875, 0.1645050048828125, 0.173065185546875, 0.1816253662109375, 0.190185546875, 0.1987457275390625, 0.207305908203125, 0.2158660888671875, 0.22442626953125, 0.2329864501953125, 0.241546630859375, 0.2501068115234375, 0.2586669921875, 0.2672271728515625, 0.275787353515625, 0.2843475341796875, 0.29290771484375, 0.3014678955078125, 0.310028076171875, 0.3185882568359375, 0.3271484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 10.0, 60.0, 338.0, 464.0, 91.0, 25.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.004013776779175, -2.925145149230957, -2.8462765216827393, -2.7674078941345215, -2.6885392665863037, -2.609670639038086, -2.530802011489868, -2.4519333839416504, -2.3730649948120117, -2.294196367263794, -2.215327739715576, -2.1364591121673584, -2.0575904846191406, -1.9787218570709229, -1.8998533487319946, -1.8209847211837769, -1.7421159744262695, -1.6632473468780518, -1.584378719329834, -1.5055100917816162, -1.4266414642333984, -1.3477728366851807, -1.2689043283462524, -1.1900357007980347, -1.111167073249817, -1.0322984457015991, -0.9534298181533813, -0.8745612502098083, -0.7956926226615906, -0.7168239951133728, -0.6379554271697998, -0.559086799621582, -0.48021793365478516, -0.4013493061065674, -0.322480708360672, -0.24361209571361542, -0.16474348306655884, -0.08587485551834106, -0.007006257772445679, 0.07186233997344971, 0.15073096752166748, 0.22959958016872406, 0.30846819281578064, 0.387336790561676, 0.4662054181098938, 0.5450740456581116, 0.6239426136016846, 0.7028112411499023, 0.7816798686981201, 0.8605484962463379, 0.9394171237945557, 1.0182857513427734, 1.0971543788909912, 1.176023006439209, 1.2548915147781372, 1.333760142326355, 1.4126287698745728, 1.4914973974227905, 1.5703660249710083, 1.649234652519226, 1.7281031608581543, 1.806971788406372, 1.8858404159545898, 1.9647090435028076, 2.0435776710510254]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 11.0, 1.0, 11.0, 7.0, 18.0, 17.0, 32.0, 46.0, 48.0, 55.0, 55.0, 78.0, 66.0, 66.0, 68.0, 71.0, 62.0, 55.0, 48.0, 45.0, 40.0, 18.0, 25.0, 16.0, 15.0, 12.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6948535442352295, -0.6740829348564148, -0.6533122658729553, -0.6325416564941406, -0.6117710471153259, -0.5910004377365112, -0.5702297687530518, -0.5494591593742371, -0.5286885499954224, -0.5079179406166077, -0.4871473014354706, -0.4663766622543335, -0.4456060528755188, -0.4248354136943817, -0.40406477451324463, -0.38329416513442993, -0.36252349615097046, -0.3417528569698334, -0.3209822475910187, -0.3002116084098816, -0.2794409990310669, -0.2586703598499298, -0.23789972066879272, -0.21712909638881683, -0.19635847210884094, -0.17558784782886505, -0.15481722354888916, -0.13404658436775208, -0.11327596008777618, -0.09250533580780029, -0.0717347040772438, -0.05096407234668732, -0.030193448066711426, -0.009422820061445236, 0.011347807943820953, 0.03211843594908714, 0.05288906395435333, 0.07365968823432922, 0.09443031996488571, 0.1152009516954422, 0.1359715759754181, 0.15674220025539398, 0.17751282453536987, 0.19828346371650696, 0.21905408799648285, 0.23982471227645874, 0.2605953514575958, 0.2813659906387329, 0.3021366000175476, 0.3229072391986847, 0.3436778485774994, 0.3644484877586365, 0.38521909713745117, 0.40598973631858826, 0.42676037549972534, 0.44753098487854004, 0.4683016240596771, 0.4890722632408142, 0.5098428726196289, 0.5306134819984436, 0.5513841509819031, 0.5721547603607178, 0.5929253697395325, 0.6136960387229919, 0.6344666481018066]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 13.0, 24.0, 20.0, 39.0, 45.0, 97.0, 186.0, 422.0, 1227.0, 5814.0, 148310.0, 866920.0, 21686.0, 2471.0, 715.0, 256.0, 121.0, 54.0, 41.0, 36.0, 16.0, 13.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.56640625, -1.52545166015625, -1.4844970703125, -1.44354248046875, -1.402587890625, -1.36163330078125, -1.3206787109375, -1.27972412109375, -1.23876953125, -1.19781494140625, -1.1568603515625, -1.11590576171875, -1.074951171875, -1.03399658203125, -0.9930419921875, -0.95208740234375, -0.9111328125, -0.87017822265625, -0.8292236328125, -0.78826904296875, -0.747314453125, -0.70635986328125, -0.6654052734375, -0.62445068359375, -0.58349609375, -0.54254150390625, -0.5015869140625, -0.46063232421875, -0.419677734375, -0.37872314453125, -0.3377685546875, -0.29681396484375, -0.255859375, -0.21490478515625, -0.1739501953125, -0.13299560546875, -0.092041015625, -0.05108642578125, -0.0101318359375, 0.03082275390625, 0.07177734375, 0.11273193359375, 0.1536865234375, 0.19464111328125, 0.235595703125, 0.27655029296875, 0.3175048828125, 0.35845947265625, 0.3994140625, 0.44036865234375, 0.4813232421875, 0.52227783203125, 0.563232421875, 0.60418701171875, 0.6451416015625, 0.68609619140625, 0.72705078125, 0.76800537109375, 0.8089599609375, 0.84991455078125, 0.890869140625, 0.93182373046875, 0.9727783203125, 1.01373291015625, 1.0546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 9.0, 16.0, 37.0, 58.0, 78.0, 121.0, 128.0, 150.0, 135.0, 108.0, 78.0, 38.0, 25.0, 11.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08734130859375, -0.08079242706298828, -0.07424354553222656, -0.06769466400146484, -0.061145782470703125, -0.054596900939941406, -0.04804801940917969, -0.04149913787841797, -0.03495025634765625, -0.02840137481689453, -0.021852493286132812, -0.015303611755371094, -0.008754730224609375, -0.0022058486938476562, 0.0043430328369140625, 0.010891914367675781, 0.0174407958984375, 0.02398967742919922, 0.030538558959960938, 0.037087440490722656, 0.043636322021484375, 0.050185203552246094, 0.05673408508300781, 0.06328296661376953, 0.06983184814453125, 0.07638072967529297, 0.08292961120605469, 0.0894784927368164, 0.09602737426757812, 0.10257625579833984, 0.10912513732910156, 0.11567401885986328, 0.122222900390625, 0.12877178192138672, 0.13532066345214844, 0.14186954498291016, 0.14841842651367188, 0.1549673080444336, 0.1615161895751953, 0.16806507110595703, 0.17461395263671875, 0.18116283416748047, 0.1877117156982422, 0.1942605972290039, 0.20080947875976562, 0.20735836029052734, 0.21390724182128906, 0.22045612335205078, 0.2270050048828125, 0.23355388641357422, 0.24010276794433594, 0.24665164947509766, 0.2532005310058594, 0.2597494125366211, 0.2662982940673828, 0.27284717559814453, 0.27939605712890625, 0.28594493865966797, 0.2924938201904297, 0.2990427017211914, 0.3055915832519531, 0.31214046478271484, 0.31868934631347656, 0.3252382278442383, 0.331787109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 11.0, 9.0, 15.0, 25.0, 32.0, 50.0, 94.0, 185.0, 401.0, 927.0, 2265.0, 7543.0, 47571.0, 770289.0, 195701.0, 16908.0, 3930.0, 1325.0, 582.0, 291.0, 163.0, 77.0, 41.0, 32.0, 27.0, 18.0, 10.0, 7.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5313262939453125, -0.507965087890625, -0.4846038818359375, -0.46124267578125, -0.4378814697265625, -0.414520263671875, -0.3911590576171875, -0.3677978515625, -0.3444366455078125, -0.321075439453125, -0.2977142333984375, -0.27435302734375, -0.2509918212890625, -0.227630615234375, -0.2042694091796875, -0.180908203125, -0.1575469970703125, -0.134185791015625, -0.1108245849609375, -0.08746337890625, -0.0641021728515625, -0.040740966796875, -0.0173797607421875, 0.0059814453125, 0.0293426513671875, 0.052703857421875, 0.0760650634765625, 0.09942626953125, 0.1227874755859375, 0.146148681640625, 0.1695098876953125, 0.19287109375, 0.2162322998046875, 0.239593505859375, 0.2629547119140625, 0.28631591796875, 0.3096771240234375, 0.333038330078125, 0.3563995361328125, 0.3797607421875, 0.4031219482421875, 0.426483154296875, 0.4498443603515625, 0.47320556640625, 0.4965667724609375, 0.519927978515625, 0.5432891845703125, 0.566650390625, 0.5900115966796875, 0.613372802734375, 0.6367340087890625, 0.66009521484375, 0.6834564208984375, 0.706817626953125, 0.7301788330078125, 0.7535400390625, 0.7769012451171875, 0.800262451171875, 0.8236236572265625, 0.84698486328125, 0.8703460693359375, 0.893707275390625, 0.9170684814453125, 0.9404296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 14.0, 10.0, 16.0, 21.0, 36.0, 44.0, 55.0, 78.0, 84.0, 77.0, 98.0, 96.0, 71.0, 48.0, 50.0, 43.0, 40.0, 27.0, 19.0, 23.0, 10.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4638671875, -0.44628143310546875, -0.4286956787109375, -0.41110992431640625, -0.393524169921875, -0.37593841552734375, -0.3583526611328125, -0.34076690673828125, -0.32318115234375, -0.30559539794921875, -0.2880096435546875, -0.27042388916015625, -0.252838134765625, -0.23525238037109375, -0.2176666259765625, -0.20008087158203125, -0.1824951171875, -0.16490936279296875, -0.1473236083984375, -0.12973785400390625, -0.112152099609375, -0.09456634521484375, -0.0769805908203125, -0.05939483642578125, -0.04180908203125, -0.02422332763671875, -0.0066375732421875, 0.01094818115234375, 0.028533935546875, 0.04611968994140625, 0.0637054443359375, 0.08129119873046875, 0.098876953125, 0.11646270751953125, 0.1340484619140625, 0.15163421630859375, 0.169219970703125, 0.18680572509765625, 0.2043914794921875, 0.22197723388671875, 0.23956298828125, 0.25714874267578125, 0.2747344970703125, 0.29232025146484375, 0.309906005859375, 0.32749176025390625, 0.3450775146484375, 0.36266326904296875, 0.3802490234375, 0.39783477783203125, 0.4154205322265625, 0.43300628662109375, 0.450592041015625, 0.46817779541015625, 0.4857635498046875, 0.5033493041992188, 0.52093505859375, 0.5385208129882812, 0.5561065673828125, 0.5736923217773438, 0.591278076171875, 0.6088638305664062, 0.6264495849609375, 0.6440353393554688, 0.66162109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 13.0, 17.0, 30.0, 45.0, 53.0, 88.0, 177.0, 320.0, 736.0, 2177.0, 9480.0, 101504.0, 806593.0, 113455.0, 9968.0, 2280.0, 799.0, 365.0, 176.0, 77.0, 66.0, 38.0, 23.0, 16.0, 15.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.16762542724609375, -0.1610565185546875, -0.15448760986328125, -0.147918701171875, -0.14134979248046875, -0.1347808837890625, -0.12821197509765625, -0.12164306640625, -0.11507415771484375, -0.1085052490234375, -0.10193634033203125, -0.095367431640625, -0.08879852294921875, -0.0822296142578125, -0.07566070556640625, -0.069091796875, -0.06252288818359375, -0.0559539794921875, -0.04938507080078125, -0.042816162109375, -0.03624725341796875, -0.0296783447265625, -0.02310943603515625, -0.01654052734375, -0.00997161865234375, -0.0034027099609375, 0.00316619873046875, 0.009735107421875, 0.01630401611328125, 0.0228729248046875, 0.02944183349609375, 0.0360107421875, 0.04257965087890625, 0.0491485595703125, 0.05571746826171875, 0.062286376953125, 0.06885528564453125, 0.0754241943359375, 0.08199310302734375, 0.08856201171875, 0.09513092041015625, 0.1016998291015625, 0.10826873779296875, 0.114837646484375, 0.12140655517578125, 0.1279754638671875, 0.13454437255859375, 0.14111328125, 0.14768218994140625, 0.1542510986328125, 0.16082000732421875, 0.167388916015625, 0.17395782470703125, 0.1805267333984375, 0.18709564208984375, 0.19366455078125, 0.20023345947265625, 0.2068023681640625, 0.21337127685546875, 0.219940185546875, 0.22650909423828125, 0.2330780029296875, 0.23964691162109375, 0.2462158203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 10.0, 5.0, 10.0, 16.0, 28.0, 30.0, 65.0, 69.0, 106.0, 124.0, 142.0, 120.0, 92.0, 63.0, 48.0, 23.0, 13.0, 18.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001919269561767578, -0.0001851152628660202, -0.0001783035695552826, -0.00017149187624454498, -0.00016468018293380737, -0.00015786848962306976, -0.00015105679631233215, -0.00014424510300159454, -0.00013743340969085693, -0.00013062171638011932, -0.00012381002306938171, -0.0001169983297586441, -0.0001101866364479065, -0.00010337494313716888, -9.656324982643127e-05, -8.975155651569366e-05, -8.293986320495605e-05, -7.612816989421844e-05, -6.931647658348083e-05, -6.250478327274323e-05, -5.5693089962005615e-05, -4.8881396651268005e-05, -4.2069703340530396e-05, -3.5258010029792786e-05, -2.8446316719055176e-05, -2.1634623408317566e-05, -1.4822930097579956e-05, -8.011236786842346e-06, -1.1995434761047363e-06, 5.6121498346328735e-06, 1.2423843145370483e-05, 1.9235536456108093e-05, 2.6047229766845703e-05, 3.285892307758331e-05, 3.967061638832092e-05, 4.648230969905853e-05, 5.329400300979614e-05, 6.010569632053375e-05, 6.691738963127136e-05, 7.372908294200897e-05, 8.054077625274658e-05, 8.735246956348419e-05, 9.41641628742218e-05, 0.00010097585618495941, 0.00010778754949569702, 0.00011459924280643463, 0.00012141093611717224, 0.00012822262942790985, 0.00013503432273864746, 0.00014184601604938507, 0.00014865770936012268, 0.0001554694026708603, 0.0001622810959815979, 0.0001690927892923355, 0.00017590448260307312, 0.00018271617591381073, 0.00018952786922454834, 0.00019633956253528595, 0.00020315125584602356, 0.00020996294915676117, 0.00021677464246749878, 0.0002235863357782364, 0.000230398029088974, 0.0002372097223997116, 0.00024402141571044922]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 5.0, 9.0, 10.0, 15.0, 35.0, 58.0, 84.0, 188.0, 353.0, 757.0, 2014.0, 7452.0, 55792.0, 730115.0, 229255.0, 16755.0, 3489.0, 1143.0, 492.0, 222.0, 126.0, 49.0, 46.0, 23.0, 18.0, 8.0, 9.0, 5.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1810302734375, -0.1749420166015625, -0.168853759765625, -0.1627655029296875, -0.15667724609375, -0.1505889892578125, -0.144500732421875, -0.1384124755859375, -0.13232421875, -0.1262359619140625, -0.120147705078125, -0.1140594482421875, -0.10797119140625, -0.1018829345703125, -0.095794677734375, -0.0897064208984375, -0.0836181640625, -0.0775299072265625, -0.071441650390625, -0.0653533935546875, -0.05926513671875, -0.0531768798828125, -0.047088623046875, -0.0410003662109375, -0.034912109375, -0.0288238525390625, -0.022735595703125, -0.0166473388671875, -0.01055908203125, -0.0044708251953125, 0.001617431640625, 0.0077056884765625, 0.0137939453125, 0.0198822021484375, 0.025970458984375, 0.0320587158203125, 0.03814697265625, 0.0442352294921875, 0.050323486328125, 0.0564117431640625, 0.0625, 0.0685882568359375, 0.074676513671875, 0.0807647705078125, 0.08685302734375, 0.0929412841796875, 0.099029541015625, 0.1051177978515625, 0.1112060546875, 0.1172943115234375, 0.123382568359375, 0.1294708251953125, 0.13555908203125, 0.1416473388671875, 0.147735595703125, 0.1538238525390625, 0.159912109375, 0.1660003662109375, 0.172088623046875, 0.1781768798828125, 0.18426513671875, 0.1903533935546875, 0.196441650390625, 0.2025299072265625, 0.2086181640625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 10.0, 26.0, 34.0, 71.0, 105.0, 134.0, 183.0, 140.0, 116.0, 65.0, 33.0, 14.0, 15.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.1299571990966797, -0.12539291381835938, -0.12082862854003906, -0.11626434326171875, -0.11170005798339844, -0.10713577270507812, -0.10257148742675781, -0.0980072021484375, -0.09344291687011719, -0.08887863159179688, -0.08431434631347656, -0.07975006103515625, -0.07518577575683594, -0.07062149047851562, -0.06605720520019531, -0.061492919921875, -0.05692863464355469, -0.052364349365234375, -0.04780006408691406, -0.04323577880859375, -0.03867149353027344, -0.034107208251953125, -0.029542922973632812, -0.0249786376953125, -0.020414352416992188, -0.015850067138671875, -0.011285781860351562, -0.00672149658203125, -0.0021572113037109375, 0.002407073974609375, 0.0069713592529296875, 0.01153564453125, 0.016099929809570312, 0.020664215087890625, 0.025228500366210938, 0.02979278564453125, 0.03435707092285156, 0.038921356201171875, 0.04348564147949219, 0.0480499267578125, 0.05261421203613281, 0.057178497314453125, 0.06174278259277344, 0.06630706787109375, 0.07087135314941406, 0.07543563842773438, 0.07999992370605469, 0.084564208984375, 0.08912849426269531, 0.09369277954101562, 0.09825706481933594, 0.10282135009765625, 0.10738563537597656, 0.11194992065429688, 0.11651420593261719, 0.1210784912109375, 0.1256427764892578, 0.13020706176757812, 0.13477134704589844, 0.13933563232421875, 0.14389991760253906, 0.14846420288085938, 0.1530284881591797, 0.1575927734375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 14.0, 40.0, 80.0, 241.0, 301.0, 183.0, 75.0, 37.0, 8.0, 10.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3282575607299805, -3.192124605178833, -3.0559914112091064, -2.919858455657959, -2.7837252616882324, -2.647592306137085, -2.5114593505859375, -2.375326156616211, -2.2391929626464844, -2.103060007095337, -1.9669268131256104, -1.830793857574463, -1.6946606636047363, -1.5585277080535889, -1.4223946332931519, -1.2862615585327148, -1.1501286029815674, -1.0139955282211304, -0.8778624534606934, -0.7417294383049011, -0.6055963635444641, -0.4694632887840271, -0.33333027362823486, -0.19719719886779785, -0.06106412410736084, 0.07506893575191498, 0.2112019956111908, 0.3473350405693054, 0.48346811532974243, 0.6196011900901794, 0.7557342052459717, 0.8918672800064087, 1.0280003547668457, 1.1641334295272827, 1.3002665042877197, 1.4363994598388672, 1.5725326538085938, 1.7086656093597412, 1.8447986841201782, 1.9809317588806152, 2.117064952850342, 2.2531979084014893, 2.389331102371216, 2.5254640579223633, 2.66159725189209, 2.7977302074432373, 2.9338631629943848, 3.0699963569641113, 3.206129312515259, 3.3422622680664062, 3.478395462036133, 3.6145284175872803, 3.750661611557007, 3.8867945671081543, 4.022927761077881, 4.159060478210449, 4.295193672180176, 4.431326866149902, 4.567459583282471, 4.703592777252197, 4.839725971221924, 4.97585916519165, 5.111991882324219, 5.248125076293945, 5.384258270263672]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 12.0, 12.0, 9.0, 10.0, 22.0, 34.0, 20.0, 28.0, 35.0, 32.0, 39.0, 35.0, 37.0, 50.0, 58.0, 49.0, 52.0, 55.0, 39.0, 32.0, 43.0, 42.0, 31.0, 21.0, 27.0, 31.0, 28.0, 15.0, 8.0, 15.0, 14.0, 12.0, 11.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.8244390487670898, -1.764106273651123, -1.7037734985351562, -1.6434407234191895, -1.5831079483032227, -1.5227751731872559, -1.462442398071289, -1.4021096229553223, -1.3417768478393555, -1.2814440727233887, -1.2211112976074219, -1.160778522491455, -1.1004457473754883, -1.0401129722595215, -0.9797801375389099, -0.9194473624229431, -0.8591145277023315, -0.7987817525863647, -0.738448977470398, -0.6781162023544312, -0.6177834272384644, -0.5574506521224976, -0.497117817401886, -0.4367850422859192, -0.3764522671699524, -0.3161194920539856, -0.2557867169380188, -0.19545391201972961, -0.13512113690376282, -0.07478836178779602, -0.014455556869506836, 0.04587721824645996, 0.10620999336242676, 0.16654276847839355, 0.22687555849552155, 0.28720834851264954, 0.34754112362861633, 0.40787389874458313, 0.4682067036628723, 0.5285394787788391, 0.5888722538948059, 0.6492050290107727, 0.7095378041267395, 0.7698706388473511, 0.8302034139633179, 0.8905361890792847, 0.9508689641952515, 1.0112017393112183, 1.071534514427185, 1.1318672895431519, 1.1922000646591187, 1.2525328397750854, 1.3128656148910522, 1.373198390007019, 1.4335312843322754, 1.4938640594482422, 1.554196834564209, 1.6145296096801758, 1.6748623847961426, 1.7351951599121094, 1.7955279350280762, 1.855860710144043, 1.9161934852600098, 1.9765262603759766, 2.0368590354919434]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 9.0, 18.0, 55.0, 171.0, 474.0, 1645.0, 7558.0, 62672.0, 4013969.0, 94875.0, 9070.0, 1997.0, 735.0, 332.0, 205.0, 116.0, 81.0, 63.0, 50.0, 39.0, 24.0, 17.0, 20.0, 17.0, 14.0, 8.0, 4.0, 8.0, 5.0, 10.0, 8.0, 4.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4463157653808594, -0.40410614013671875, -0.3618965148925781, -0.3196868896484375, -0.2774772644042969, -0.23526763916015625, -0.19305801391601562, -0.150848388671875, -0.10863876342773438, -0.06642913818359375, -0.024219512939453125, 0.0179901123046875, 0.060199737548828125, 0.10240936279296875, 0.14461898803710938, 0.18682861328125, 0.22903823852539062, 0.27124786376953125, 0.3134574890136719, 0.3556671142578125, 0.3978767395019531, 0.44008636474609375, 0.4822959899902344, 0.524505615234375, 0.5667152404785156, 0.6089248657226562, 0.6511344909667969, 0.6933441162109375, 0.7355537414550781, 0.7777633666992188, 0.8199729919433594, 0.8621826171875, 0.9043922424316406, 0.9466018676757812, 0.9888114929199219, 1.0310211181640625, 1.0732307434082031, 1.1154403686523438, 1.1576499938964844, 1.199859619140625, 1.2420692443847656, 1.2842788696289062, 1.3264884948730469, 1.3686981201171875, 1.4109077453613281, 1.4531173706054688, 1.4953269958496094, 1.53753662109375, 1.5797462463378906, 1.6219558715820312, 1.6641654968261719, 1.7063751220703125, 1.7485847473144531, 1.7907943725585938, 1.8330039978027344, 1.875213623046875, 1.9174232482910156, 1.9596328735351562, 2.001842498779297, 2.0440521240234375, 2.086261749267578, 2.1284713745117188, 2.1706809997558594, 2.212890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 12.0, 21.0, 42.0, 50.0, 88.0, 137.0, 142.0, 137.0, 128.0, 108.0, 58.0, 52.0, 18.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07281494140625, -0.06629085540771484, -0.05976676940917969, -0.05324268341064453, -0.046718597412109375, -0.04019451141357422, -0.03367042541503906, -0.027146339416503906, -0.02062225341796875, -0.014098167419433594, -0.0075740814208984375, -0.0010499954223632812, 0.005474090576171875, 0.011998176574707031, 0.018522262573242188, 0.025046348571777344, 0.0315704345703125, 0.038094520568847656, 0.04461860656738281, 0.05114269256591797, 0.057666778564453125, 0.06419086456298828, 0.07071495056152344, 0.0772390365600586, 0.08376312255859375, 0.0902872085571289, 0.09681129455566406, 0.10333538055419922, 0.10985946655273438, 0.11638355255126953, 0.12290763854980469, 0.12943172454833984, 0.135955810546875, 0.14247989654541016, 0.1490039825439453, 0.15552806854248047, 0.16205215454101562, 0.16857624053955078, 0.17510032653808594, 0.1816244125366211, 0.18814849853515625, 0.1946725845336914, 0.20119667053222656, 0.20772075653076172, 0.21424484252929688, 0.22076892852783203, 0.2272930145263672, 0.23381710052490234, 0.2403411865234375, 0.24686527252197266, 0.2533893585205078, 0.25991344451904297, 0.2664375305175781, 0.2729616165161133, 0.27948570251464844, 0.2860097885131836, 0.29253387451171875, 0.2990579605102539, 0.30558204650878906, 0.3121061325073242, 0.3186302185058594, 0.32515430450439453, 0.3316783905029297, 0.33820247650146484, 0.3447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 10.0, 20.0, 40.0, 46.0, 109.0, 244.0, 931.0, 6807.0, 4112493.0, 68397.0, 3773.0, 823.0, 263.0, 116.0, 57.0, 42.0, 37.0, 28.0, 16.0, 11.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.30712890625, -2.1962890625, -2.08544921875, -1.974609375, -1.86376953125, -1.7529296875, -1.64208984375, -1.53125, -1.42041015625, -1.3095703125, -1.19873046875, -1.087890625, -0.97705078125, -0.8662109375, -0.75537109375, -0.64453125, -0.53369140625, -0.4228515625, -0.31201171875, -0.201171875, -0.09033203125, 0.0205078125, 0.13134765625, 0.2421875, 0.35302734375, 0.4638671875, 0.57470703125, 0.685546875, 0.79638671875, 0.9072265625, 1.01806640625, 1.12890625, 1.23974609375, 1.3505859375, 1.46142578125, 1.572265625, 1.68310546875, 1.7939453125, 1.90478515625, 2.015625, 2.12646484375, 2.2373046875, 2.34814453125, 2.458984375, 2.56982421875, 2.6806640625, 2.79150390625, 2.90234375, 3.01318359375, 3.1240234375, 3.23486328125, 3.345703125, 3.45654296875, 3.5673828125, 3.67822265625, 3.7890625, 3.89990234375, 4.0107421875, 4.12158203125, 4.232421875, 4.34326171875, 4.4541015625, 4.56494140625, 4.67578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 12.0, 25.0, 73.0, 2441.0, 1340.0, 102.0, 25.0, 16.0, 5.0, 5.0, 5.0, 2.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302978515625, -0.2753257751464844, -0.24767303466796875, -0.22002029418945312, -0.1923675537109375, -0.16471481323242188, -0.13706207275390625, -0.10940933227539062, -0.081756591796875, -0.054103851318359375, -0.02645111083984375, 0.001201629638671875, 0.0288543701171875, 0.056507110595703125, 0.08415985107421875, 0.11181259155273438, 0.13946533203125, 0.16711807250976562, 0.19477081298828125, 0.22242355346679688, 0.2500762939453125, 0.2777290344238281, 0.30538177490234375, 0.3330345153808594, 0.360687255859375, 0.3883399963378906, 0.41599273681640625, 0.4436454772949219, 0.4712982177734375, 0.4989509582519531, 0.5266036987304688, 0.5542564392089844, 0.5819091796875, 0.6095619201660156, 0.6372146606445312, 0.6648674011230469, 0.6925201416015625, 0.7201728820800781, 0.7478256225585938, 0.7754783630371094, 0.803131103515625, 0.8307838439941406, 0.8584365844726562, 0.8860893249511719, 0.9137420654296875, 0.9413948059082031, 0.9690475463867188, 0.9967002868652344, 1.02435302734375, 1.0520057678222656, 1.0796585083007812, 1.1073112487792969, 1.1349639892578125, 1.1626167297363281, 1.1902694702148438, 1.2179222106933594, 1.245574951171875, 1.2732276916503906, 1.3008804321289062, 1.3285331726074219, 1.3561859130859375, 1.3838386535644531, 1.4114913940429688, 1.4391441345214844, 1.466796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 15.0, 74.0, 447.0, 370.0, 62.0, 21.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.511024236679077, -2.3305482864379883, -2.1500725746154785, -1.9695967435836792, -1.7891209125518799, -1.6086450815200806, -1.4281692504882812, -1.247693419456482, -1.0672175884246826, -0.8867417573928833, -0.706265926361084, -0.5257900953292847, -0.34531426429748535, -0.16483843326568604, 0.01563739776611328, 0.1961132287979126, 0.3765890598297119, 0.5570648908615112, 0.7375407218933105, 0.9180165529251099, 1.0984923839569092, 1.2789682149887085, 1.4594440460205078, 1.6399198770523071, 1.8203957080841064, 2.0008716583251953, 2.181347370147705, 2.361823081970215, 2.5422990322113037, 2.7227749824523926, 2.9032506942749023, 3.083726406097412, 3.264202117919922, 3.4446778297424316, 3.6251537799835205, 3.8056297302246094, 3.986105442047119, 4.166581153869629, 4.347057342529297, 4.527533054351807, 4.708008766174316, 4.888484477996826, 5.068960189819336, 5.249436378479004, 5.429912090301514, 5.610387802124023, 5.790863990783691, 5.971339702606201, 6.151815414428711, 6.332291126251221, 6.5127668380737305, 6.693243026733398, 6.873718738555908, 7.054194450378418, 7.234670639038086, 7.415146350860596, 7.5956220626831055, 7.776097774505615, 7.956573486328125, 8.137049674987793, 8.317525863647461, 8.498001098632812, 8.67847728729248, 8.858952522277832, 9.0394287109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 12.0, 36.0, 61.0, 98.0, 131.0, 148.0, 174.0, 139.0, 77.0, 66.0, 36.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7043089866638184, -3.5832324028015137, -3.462155818939209, -3.3410792350769043, -3.2200026512145996, -3.098926067352295, -2.9778494834899902, -2.8567731380462646, -2.73569655418396, -2.6146199703216553, -2.4935433864593506, -2.372466802597046, -2.251390218734741, -2.1303138732910156, -2.009237289428711, -1.8881607055664062, -1.767084002494812, -1.6460074186325073, -1.5249308347702026, -1.4038543701171875, -1.2827777862548828, -1.1617012023925781, -1.0406246185302734, -0.9195480942726135, -0.7984715104103088, -0.6773949265480042, -0.5563184022903442, -0.43524181842803955, -0.31416526436805725, -0.19308871030807495, -0.07201212644577026, 0.04906439781188965, 0.17014098167419434, 0.29121753573417664, 0.41229408979415894, 0.5333706736564636, 0.6544471979141235, 0.7755237817764282, 0.8966003656387329, 1.017676830291748, 1.1387534141540527, 1.2598299980163574, 1.380906581878662, 1.5019831657409668, 1.623059630393982, 1.7441362142562866, 1.8652127981185913, 1.9862892627716064, 2.1073660850524902, 2.228442668914795, 2.3495192527770996, 2.4705958366394043, 2.591672420501709, 2.7127490043640137, 2.8338255882263184, 2.954901933670044, 3.0759785175323486, 3.1970551013946533, 3.318131685256958, 3.4392082691192627, 3.5602848529815674, 3.681361198425293, 3.8024377822875977, 3.9235143661499023, 4.044590950012207]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 12.0, 14.0, 20.0, 26.0, 32.0, 54.0, 86.0, 95.0, 193.0, 356.0, 633.0, 1755.0, 9214.0, 147327.0, 832089.0, 49430.0, 4734.0, 1175.0, 511.0, 282.0, 158.0, 101.0, 66.0, 50.0, 42.0, 24.0, 14.0, 17.0, 12.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1572265625, -1.1262283325195312, -1.0952301025390625, -1.0642318725585938, -1.033233642578125, -1.0022354125976562, -0.9712371826171875, -0.9402389526367188, -0.90924072265625, -0.8782424926757812, -0.8472442626953125, -0.8162460327148438, -0.785247802734375, -0.7542495727539062, -0.7232513427734375, -0.6922531127929688, -0.6612548828125, -0.6302566528320312, -0.5992584228515625, -0.5682601928710938, -0.537261962890625, -0.5062637329101562, -0.4752655029296875, -0.44426727294921875, -0.41326904296875, -0.38227081298828125, -0.3512725830078125, -0.32027435302734375, -0.289276123046875, -0.25827789306640625, -0.2272796630859375, -0.19628143310546875, -0.165283203125, -0.13428497314453125, -0.1032867431640625, -0.07228851318359375, -0.041290283203125, -0.01029205322265625, 0.0207061767578125, 0.05170440673828125, 0.08270263671875, 0.11370086669921875, 0.1446990966796875, 0.17569732666015625, 0.206695556640625, 0.23769378662109375, 0.2686920166015625, 0.29969024658203125, 0.3306884765625, 0.36168670654296875, 0.3926849365234375, 0.42368316650390625, 0.454681396484375, 0.48567962646484375, 0.5166778564453125, 0.5476760864257812, 0.57867431640625, 0.6096725463867188, 0.6406707763671875, 0.6716690063476562, 0.702667236328125, 0.7336654663085938, 0.7646636962890625, 0.7956619262695312, 0.82666015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 16.0, 39.0, 72.0, 137.0, 164.0, 153.0, 158.0, 117.0, 76.0, 45.0, 17.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2000732421875, -0.19156455993652344, -0.18305587768554688, -0.1745471954345703, -0.16603851318359375, -0.1575298309326172, -0.14902114868164062, -0.14051246643066406, -0.1320037841796875, -0.12349510192871094, -0.11498641967773438, -0.10647773742675781, -0.09796905517578125, -0.08946037292480469, -0.08095169067382812, -0.07244300842285156, -0.063934326171875, -0.05542564392089844, -0.046916961669921875, -0.03840827941894531, -0.02989959716796875, -0.021390914916992188, -0.012882232666015625, -0.0043735504150390625, 0.0041351318359375, 0.012643814086914062, 0.021152496337890625, 0.029661178588867188, 0.03816986083984375, 0.04667854309082031, 0.055187225341796875, 0.06369590759277344, 0.07220458984375, 0.08071327209472656, 0.08922195434570312, 0.09773063659667969, 0.10623931884765625, 0.11474800109863281, 0.12325668334960938, 0.13176536560058594, 0.1402740478515625, 0.14878273010253906, 0.15729141235351562, 0.1658000946044922, 0.17430877685546875, 0.1828174591064453, 0.19132614135742188, 0.19983482360839844, 0.208343505859375, 0.21685218811035156, 0.22536087036132812, 0.2338695526123047, 0.24237823486328125, 0.2508869171142578, 0.2593955993652344, 0.26790428161621094, 0.2764129638671875, 0.28492164611816406, 0.2934303283691406, 0.3019390106201172, 0.31044769287109375, 0.3189563751220703, 0.3274650573730469, 0.33597373962402344, 0.344482421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 14.0, 12.0, 20.0, 29.0, 40.0, 77.0, 129.0, 256.0, 553.0, 1413.0, 4775.0, 20745.0, 151283.0, 701305.0, 140833.0, 19910.0, 4667.0, 1397.0, 510.0, 223.0, 134.0, 64.0, 44.0, 36.0, 19.0, 18.0, 9.0, 9.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.369354248046875, -0.35540771484375, -0.341461181640625, -0.3275146484375, -0.313568115234375, -0.29962158203125, -0.285675048828125, -0.271728515625, -0.257781982421875, -0.24383544921875, -0.229888916015625, -0.2159423828125, -0.201995849609375, -0.18804931640625, -0.174102783203125, -0.16015625, -0.146209716796875, -0.13226318359375, -0.118316650390625, -0.1043701171875, -0.090423583984375, -0.07647705078125, -0.062530517578125, -0.048583984375, -0.034637451171875, -0.02069091796875, -0.006744384765625, 0.0072021484375, 0.021148681640625, 0.03509521484375, 0.049041748046875, 0.06298828125, 0.076934814453125, 0.09088134765625, 0.104827880859375, 0.1187744140625, 0.132720947265625, 0.14666748046875, 0.160614013671875, 0.174560546875, 0.188507080078125, 0.20245361328125, 0.216400146484375, 0.2303466796875, 0.244293212890625, 0.25823974609375, 0.272186279296875, 0.2861328125, 0.300079345703125, 0.31402587890625, 0.327972412109375, 0.3419189453125, 0.355865478515625, 0.36981201171875, 0.383758544921875, 0.397705078125, 0.411651611328125, 0.42559814453125, 0.439544677734375, 0.4534912109375, 0.467437744140625, 0.48138427734375, 0.495330810546875, 0.50927734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 2.0, 2.0, 5.0, 7.0, 10.0, 6.0, 9.0, 15.0, 9.0, 21.0, 24.0, 31.0, 29.0, 41.0, 35.0, 51.0, 47.0, 41.0, 51.0, 50.0, 48.0, 59.0, 64.0, 55.0, 52.0, 46.0, 32.0, 39.0, 14.0, 28.0, 16.0, 11.0, 14.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27880859375, -0.2684898376464844, -0.25817108154296875, -0.24785232543945312, -0.2375335693359375, -0.22721481323242188, -0.21689605712890625, -0.20657730102539062, -0.196258544921875, -0.18593978881835938, -0.17562103271484375, -0.16530227661132812, -0.1549835205078125, -0.14466476440429688, -0.13434600830078125, -0.12402725219726562, -0.11370849609375, -0.10338973999023438, -0.09307098388671875, -0.08275222778320312, -0.0724334716796875, -0.062114715576171875, -0.05179595947265625, -0.041477203369140625, -0.031158447265625, -0.020839691162109375, -0.01052093505859375, -0.000202178955078125, 0.0101165771484375, 0.020435333251953125, 0.03075408935546875, 0.041072845458984375, 0.0513916015625, 0.061710357666015625, 0.07202911376953125, 0.08234786987304688, 0.0926666259765625, 0.10298538208007812, 0.11330413818359375, 0.12362289428710938, 0.133941650390625, 0.14426040649414062, 0.15457916259765625, 0.16489791870117188, 0.1752166748046875, 0.18553543090820312, 0.19585418701171875, 0.20617294311523438, 0.21649169921875, 0.22681045532226562, 0.23712921142578125, 0.24744796752929688, 0.2577667236328125, 0.2680854797363281, 0.27840423583984375, 0.2887229919433594, 0.299041748046875, 0.3093605041503906, 0.31967926025390625, 0.3299980163574219, 0.3403167724609375, 0.3506355285644531, 0.36095428466796875, 0.3712730407714844, 0.381591796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 10.0, 16.0, 36.0, 63.0, 99.0, 194.0, 334.0, 739.0, 1841.0, 5987.0, 31854.0, 274944.0, 600614.0, 111402.0, 14493.0, 3461.0, 1262.0, 562.0, 279.0, 139.0, 81.0, 39.0, 30.0, 17.0, 10.0, 8.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15625, -0.15169334411621094, -0.14713668823242188, -0.1425800323486328, -0.13802337646484375, -0.1334667205810547, -0.12891006469726562, -0.12435340881347656, -0.1197967529296875, -0.11524009704589844, -0.11068344116210938, -0.10612678527832031, -0.10157012939453125, -0.09701347351074219, -0.09245681762695312, -0.08790016174316406, -0.083343505859375, -0.07878684997558594, -0.07423019409179688, -0.06967353820800781, -0.06511688232421875, -0.06056022644042969, -0.056003570556640625, -0.05144691467285156, -0.0468902587890625, -0.04233360290527344, -0.037776947021484375, -0.03322029113769531, -0.02866363525390625, -0.024106979370117188, -0.019550323486328125, -0.014993667602539062, -0.01043701171875, -0.0058803558349609375, -0.001323699951171875, 0.0032329559326171875, 0.00778961181640625, 0.012346267700195312, 0.016902923583984375, 0.021459579467773438, 0.0260162353515625, 0.030572891235351562, 0.035129547119140625, 0.03968620300292969, 0.04424285888671875, 0.04879951477050781, 0.053356170654296875, 0.05791282653808594, 0.062469482421875, 0.06702613830566406, 0.07158279418945312, 0.07613945007324219, 0.08069610595703125, 0.08525276184082031, 0.08980941772460938, 0.09436607360839844, 0.0989227294921875, 0.10347938537597656, 0.10803604125976562, 0.11259269714355469, 0.11714935302734375, 0.12170600891113281, 0.12626266479492188, 0.13081932067871094, 0.1353759765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 11.0, 13.0, 23.0, 38.0, 74.0, 139.0, 196.0, 173.0, 135.0, 90.0, 43.0, 32.0, 17.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019407272338867188, -0.00018336623907089233, -0.0001726597547531128, -0.00016195327043533325, -0.0001512467861175537, -0.00014054030179977417, -0.00012983381748199463, -0.00011912733316421509, -0.00010842084884643555, -9.7714364528656e-05, -8.700788021087646e-05, -7.630139589309692e-05, -6.559491157531738e-05, -5.488842725753784e-05, -4.41819429397583e-05, -3.347545862197876e-05, -2.276897430419922e-05, -1.2062489986419678e-05, -1.3560056686401367e-06, 9.350478649139404e-06, 2.0056962966918945e-05, 3.0763447284698486e-05, 4.146993160247803e-05, 5.217641592025757e-05, 6.288290023803711e-05, 7.358938455581665e-05, 8.429586887359619e-05, 9.500235319137573e-05, 0.00010570883750915527, 0.00011641532182693481, 0.00012712180614471436, 0.0001378282904624939, 0.00014853477478027344, 0.00015924125909805298, 0.00016994774341583252, 0.00018065422773361206, 0.0001913607120513916, 0.00020206719636917114, 0.00021277368068695068, 0.00022348016500473022, 0.00023418664932250977, 0.0002448931336402893, 0.00025559961795806885, 0.0002663061022758484, 0.00027701258659362793, 0.00028771907091140747, 0.000298425555229187, 0.00030913203954696655, 0.0003198385238647461, 0.00033054500818252563, 0.0003412514925003052, 0.0003519579768180847, 0.00036266446113586426, 0.0003733709454536438, 0.00038407742977142334, 0.0003947839140892029, 0.0004054903984069824, 0.00041619688272476196, 0.0004269033670425415, 0.00043760985136032104, 0.0004483163356781006, 0.0004590228199958801, 0.00046972930431365967, 0.0004804357886314392, 0.0004911422729492188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 6.0, 4.0, 11.0, 23.0, 26.0, 51.0, 87.0, 171.0, 351.0, 722.0, 2108.0, 7758.0, 44707.0, 397484.0, 515370.0, 65506.0, 9868.0, 2593.0, 859.0, 404.0, 188.0, 103.0, 45.0, 28.0, 16.0, 14.0, 10.0, 9.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14750289916992188, -0.14290618896484375, -0.13830947875976562, -0.1337127685546875, -0.12911605834960938, -0.12451934814453125, -0.11992263793945312, -0.115325927734375, -0.11072921752929688, -0.10613250732421875, -0.10153579711914062, -0.0969390869140625, -0.09234237670898438, -0.08774566650390625, -0.08314895629882812, -0.07855224609375, -0.07395553588867188, -0.06935882568359375, -0.06476211547851562, -0.0601654052734375, -0.055568695068359375, -0.05097198486328125, -0.046375274658203125, -0.041778564453125, -0.037181854248046875, -0.03258514404296875, -0.027988433837890625, -0.0233917236328125, -0.018795013427734375, -0.01419830322265625, -0.009601593017578125, -0.0050048828125, -0.000408172607421875, 0.00418853759765625, 0.008785247802734375, 0.0133819580078125, 0.017978668212890625, 0.02257537841796875, 0.027172088623046875, 0.031768798828125, 0.036365509033203125, 0.04096221923828125, 0.045558929443359375, 0.0501556396484375, 0.054752349853515625, 0.05934906005859375, 0.06394577026367188, 0.06854248046875, 0.07313919067382812, 0.07773590087890625, 0.08233261108398438, 0.0869293212890625, 0.09152603149414062, 0.09612274169921875, 0.10071945190429688, 0.105316162109375, 0.10991287231445312, 0.11450958251953125, 0.11910629272460938, 0.1237030029296875, 0.12829971313476562, 0.13289642333984375, 0.13749313354492188, 0.14208984375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 10.0, 14.0, 26.0, 29.0, 41.0, 71.0, 97.0, 117.0, 113.0, 121.0, 104.0, 71.0, 48.0, 37.0, 39.0, 20.0, 7.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09651374816894531, -0.09244155883789062, -0.08836936950683594, -0.08429718017578125, -0.08022499084472656, -0.07615280151367188, -0.07208061218261719, -0.0680084228515625, -0.06393623352050781, -0.059864044189453125, -0.05579185485839844, -0.05171966552734375, -0.04764747619628906, -0.043575286865234375, -0.03950309753417969, -0.035430908203125, -0.03135871887207031, -0.027286529541015625, -0.023214340209960938, -0.01914215087890625, -0.015069961547851562, -0.010997772216796875, -0.0069255828857421875, -0.0028533935546875, 0.0012187957763671875, 0.005290985107421875, 0.009363174438476562, 0.01343536376953125, 0.017507553100585938, 0.021579742431640625, 0.025651931762695312, 0.02972412109375, 0.03379631042480469, 0.037868499755859375, 0.04194068908691406, 0.04601287841796875, 0.05008506774902344, 0.054157257080078125, 0.05822944641113281, 0.0623016357421875, 0.06637382507324219, 0.07044601440429688, 0.07451820373535156, 0.07859039306640625, 0.08266258239746094, 0.08673477172851562, 0.09080696105957031, 0.094879150390625, 0.09895133972167969, 0.10302352905273438, 0.10709571838378906, 0.11116790771484375, 0.11524009704589844, 0.11931228637695312, 0.12338447570800781, 0.1274566650390625, 0.1315288543701172, 0.13560104370117188, 0.13967323303222656, 0.14374542236328125, 0.14781761169433594, 0.15188980102539062, 0.1559619903564453, 0.1600341796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 13.0, 15.0, 25.0, 48.0, 87.0, 184.0, 222.0, 194.0, 98.0, 52.0, 23.0, 15.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.639617919921875, -2.558884859085083, -2.478151798248291, -2.397418737411499, -2.316685676574707, -2.235952615737915, -2.155219554901123, -2.074486255645752, -1.9937533140182495, -1.9130202531814575, -1.8322871923446655, -1.7515541315078735, -1.670820951461792, -1.590087890625, -1.509354829788208, -1.428621768951416, -1.347888708114624, -1.267155647277832, -1.18642258644104, -1.105689525604248, -1.024956464767456, -0.9442233443260193, -0.8634902238845825, -0.7827571630477905, -0.7020241022109985, -0.6212910413742065, -0.5405579805374146, -0.4598248600959778, -0.3790917992591858, -0.2983587384223938, -0.21762564778327942, -0.13689255714416504, -0.056159257888793945, 0.02457381784915924, 0.10530689358711243, 0.1860399693250656, 0.2667730450630188, 0.3475061058998108, 0.42823919653892517, 0.5089722871780396, 0.5897053480148315, 0.6704384088516235, 0.7511714696884155, 0.8319045901298523, 0.9126376509666443, 0.9933707118034363, 1.074103832244873, 1.154836893081665, 1.235569953918457, 1.316303014755249, 1.397036075592041, 1.477769136428833, 1.558502197265625, 1.639235258102417, 1.7199684381484985, 1.8007014989852905, 1.8814345598220825, 1.9621676206588745, 2.042900800704956, 2.123633861541748, 2.20436692237854, 2.285099983215332, 2.365833044052124, 2.446566104888916, 2.527299165725708]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 10.0, 8.0, 9.0, 20.0, 22.0, 19.0, 28.0, 38.0, 41.0, 39.0, 54.0, 48.0, 61.0, 72.0, 65.0, 75.0, 55.0, 55.0, 56.0, 48.0, 37.0, 30.0, 22.0, 18.0, 15.0, 21.0, 15.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.3562161922454834, -2.291783332824707, -2.2273507118225098, -2.1629178524017334, -2.098484992980957, -2.0340521335601807, -1.9696193933486938, -1.905186653137207, -1.8407537937164307, -1.7763209342956543, -1.7118881940841675, -1.6474554538726807, -1.5830225944519043, -1.518589735031128, -1.4541569948196411, -1.3897242546081543, -1.325291395187378, -1.2608585357666016, -1.1964257955551147, -1.131993055343628, -1.0675601959228516, -1.0031273365020752, -0.9386945962905884, -0.8742617964744568, -0.8098289966583252, -0.7453961968421936, -0.680963397026062, -0.6165305972099304, -0.5520977973937988, -0.48766499757766724, -0.42323219776153564, -0.35879939794540405, -0.29436659812927246, -0.22993379831314087, -0.16550099849700928, -0.10106819868087769, -0.036635398864746094, 0.027797400951385498, 0.09223020076751709, 0.15666300058364868, 0.22109580039978027, 0.28552860021591187, 0.34996140003204346, 0.41439419984817505, 0.47882699966430664, 0.5432597994804382, 0.6076925992965698, 0.6721253991127014, 0.736558198928833, 0.8009909987449646, 0.8654237985610962, 0.9298565983772278, 0.9942893981933594, 1.0587222576141357, 1.1231549978256226, 1.1875877380371094, 1.2520205974578857, 1.316453456878662, 1.380886197090149, 1.4453189373016357, 1.509751796722412, 1.5741846561431885, 1.6386173963546753, 1.703050136566162, 1.7674829959869385]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 12.0, 24.0, 43.0, 122.0, 297.0, 786.0, 4169.0, 197155.0, 3980725.0, 8616.0, 1326.0, 487.0, 227.0, 116.0, 61.0, 30.0, 23.0, 18.0, 18.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9121170043945312, -0.8618316650390625, -0.8115463256835938, -0.761260986328125, -0.7109756469726562, -0.6606903076171875, -0.6104049682617188, -0.56011962890625, -0.5098342895507812, -0.4595489501953125, -0.40926361083984375, -0.358978271484375, -0.30869293212890625, -0.2584075927734375, -0.20812225341796875, -0.1578369140625, -0.10755157470703125, -0.0572662353515625, -0.00698089599609375, 0.043304443359375, 0.09358978271484375, 0.1438751220703125, 0.19416046142578125, 0.24444580078125, 0.29473114013671875, 0.3450164794921875, 0.39530181884765625, 0.445587158203125, 0.49587249755859375, 0.5461578369140625, 0.5964431762695312, 0.646728515625, 0.6970138549804688, 0.7472991943359375, 0.7975845336914062, 0.847869873046875, 0.8981552124023438, 0.9484405517578125, 0.9987258911132812, 1.04901123046875, 1.0992965698242188, 1.1495819091796875, 1.1998672485351562, 1.250152587890625, 1.3004379272460938, 1.3507232666015625, 1.4010086059570312, 1.4512939453125, 1.5015792846679688, 1.5518646240234375, 1.6021499633789062, 1.652435302734375, 1.7027206420898438, 1.7530059814453125, 1.8032913208007812, 1.85357666015625, 1.9038619995117188, 1.9541473388671875, 2.0044326782226562, 2.054718017578125, 2.1050033569335938, 2.1552886962890625, 2.2055740356445312, 2.255859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 17.0, 32.0, 67.0, 105.0, 144.0, 144.0, 140.0, 138.0, 102.0, 62.0, 31.0, 18.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180419921875, -0.1722259521484375, -0.164031982421875, -0.1558380126953125, -0.14764404296875, -0.1394500732421875, -0.131256103515625, -0.1230621337890625, -0.1148681640625, -0.1066741943359375, -0.098480224609375, -0.0902862548828125, -0.08209228515625, -0.0738983154296875, -0.065704345703125, -0.0575103759765625, -0.04931640625, -0.0411224365234375, -0.032928466796875, -0.0247344970703125, -0.01654052734375, -0.0083465576171875, -0.000152587890625, 0.0080413818359375, 0.0162353515625, 0.0244293212890625, 0.032623291015625, 0.0408172607421875, 0.04901123046875, 0.0572052001953125, 0.065399169921875, 0.0735931396484375, 0.081787109375, 0.0899810791015625, 0.098175048828125, 0.1063690185546875, 0.11456298828125, 0.1227569580078125, 0.130950927734375, 0.1391448974609375, 0.1473388671875, 0.1555328369140625, 0.163726806640625, 0.1719207763671875, 0.18011474609375, 0.1883087158203125, 0.196502685546875, 0.2046966552734375, 0.212890625, 0.2210845947265625, 0.229278564453125, 0.2374725341796875, 0.24566650390625, 0.2538604736328125, 0.262054443359375, 0.2702484130859375, 0.2784423828125, 0.2866363525390625, 0.294830322265625, 0.3030242919921875, 0.31121826171875, 0.3194122314453125, 0.327606201171875, 0.3358001708984375, 0.343994140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 8.0, 11.0, 18.0, 30.0, 29.0, 37.0, 45.0, 54.0, 79.0, 130.0, 438.0, 8088.0, 4179044.0, 5613.0, 301.0, 124.0, 72.0, 44.0, 34.0, 20.0, 24.0, 16.0, 7.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.516265869140625, -2.43878173828125, -2.361297607421875, -2.2838134765625, -2.206329345703125, -2.12884521484375, -2.051361083984375, -1.973876953125, -1.896392822265625, -1.81890869140625, -1.741424560546875, -1.6639404296875, -1.586456298828125, -1.50897216796875, -1.431488037109375, -1.35400390625, -1.276519775390625, -1.19903564453125, -1.121551513671875, -1.0440673828125, -0.966583251953125, -0.88909912109375, -0.811614990234375, -0.734130859375, -0.656646728515625, -0.57916259765625, -0.501678466796875, -0.4241943359375, -0.346710205078125, -0.26922607421875, -0.191741943359375, -0.1142578125, -0.036773681640625, 0.04071044921875, 0.118194580078125, 0.1956787109375, 0.273162841796875, 0.35064697265625, 0.428131103515625, 0.505615234375, 0.583099365234375, 0.66058349609375, 0.738067626953125, 0.8155517578125, 0.893035888671875, 0.97052001953125, 1.048004150390625, 1.12548828125, 1.202972412109375, 1.28045654296875, 1.357940673828125, 1.4354248046875, 1.512908935546875, 1.59039306640625, 1.667877197265625, 1.745361328125, 1.822845458984375, 1.90032958984375, 1.977813720703125, 2.0552978515625, 2.132781982421875, 2.21026611328125, 2.287750244140625, 2.365234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 10.0, 32.0, 159.0, 3399.0, 407.0, 46.0, 14.0, 4.0, 4.0], "bins": [-1.076171875, -1.0578393936157227, -1.0395069122314453, -1.021174430847168, -1.0028419494628906, -0.9845094680786133, -0.9661769866943359, -0.9478445053100586, -0.9295120239257812, -0.9111795425415039, -0.8928470611572266, -0.8745145797729492, -0.8561820983886719, -0.8378496170043945, -0.8195171356201172, -0.8011846542358398, -0.7828521728515625, -0.7645196914672852, -0.7461872100830078, -0.7278547286987305, -0.7095222473144531, -0.6911897659301758, -0.6728572845458984, -0.6545248031616211, -0.6361923217773438, -0.6178598403930664, -0.5995273590087891, -0.5811948776245117, -0.5628623962402344, -0.544529914855957, -0.5261974334716797, -0.5078649520874023, -0.489532470703125, -0.47119998931884766, -0.4528675079345703, -0.43453502655029297, -0.4162025451660156, -0.3978700637817383, -0.37953758239746094, -0.3612051010131836, -0.34287261962890625, -0.3245401382446289, -0.30620765686035156, -0.2878751754760742, -0.2695426940917969, -0.25121021270751953, -0.2328777313232422, -0.21454524993896484, -0.1962127685546875, -0.17788028717041016, -0.1595478057861328, -0.14121532440185547, -0.12288284301757812, -0.10455036163330078, -0.08621788024902344, -0.0678853988647461, -0.04955291748046875, -0.031220436096191406, -0.012887954711914062, 0.005444526672363281, 0.023777008056640625, 0.04210948944091797, 0.06044197082519531, 0.07877445220947266, 0.09710693359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 30.0, 823.0, 146.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.311243057250977, -12.036275863647461, -11.761307716369629, -11.486340522766113, -11.211372375488281, -10.936405181884766, -10.66143798828125, -10.386469841003418, -10.111502647399902, -9.836535453796387, -9.561567306518555, -9.286600112915039, -9.011631965637207, -8.736664772033691, -8.46169662475586, -8.186729431152344, -7.91176176071167, -7.636794090270996, -7.361826419830322, -7.086858749389648, -6.811891555786133, -6.536923885345459, -6.261956214904785, -5.986988544464111, -5.7120208740234375, -5.437053203582764, -5.16208553314209, -4.887118339538574, -4.6121506690979, -4.337182998657227, -4.062215328216553, -3.787247657775879, -3.512279987335205, -3.2373123168945312, -2.9623448848724365, -2.6873772144317627, -2.412409782409668, -2.137442111968994, -1.8624744415283203, -1.587506890296936, -1.3125393390655518, -1.0375717878341675, -0.7626041769981384, -0.4876365661621094, -0.2126690149307251, 0.06229853630065918, 0.337266206741333, 0.6122337579727173, 0.8872013092041016, 1.1621688604354858, 1.4371364116668701, 1.712104082107544, 1.9870716333389282, 2.2620391845703125, 2.5370068550109863, 2.81197452545166, 3.086941957473755, 3.3619096279144287, 3.6368770599365234, 3.9118447303771973, 4.186812400817871, 4.461779594421387, 4.736747741699219, 5.011714935302734, 5.286682605743408]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 9.0, 43.0, 83.0, 171.0, 241.0, 229.0, 139.0, 58.0, 22.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.085524082183838, -2.99118709564209, -2.8968498706817627, -2.8025128841400146, -2.7081756591796875, -2.6138386726379395, -2.5195016860961914, -2.4251644611358643, -2.330827236175537, -2.236490249633789, -2.142153024673462, -2.047816038131714, -1.9534788131713867, -1.8591418266296387, -1.764804720878601, -1.6704676151275635, -1.5761306285858154, -1.4817935228347778, -1.3874564170837402, -1.2931194305419922, -1.198782205581665, -1.104445219039917, -1.0101081132888794, -0.9157710075378418, -0.8214339017868042, -0.7270967960357666, -0.632759690284729, -0.5384226441383362, -0.4440855383872986, -0.349748432636261, -0.25541138648986816, -0.16107428073883057, -0.06673693656921387, 0.027600154280662537, 0.12193724513053894, 0.21627432107925415, 0.31061142683029175, 0.40494853258132935, 0.49928557872772217, 0.5936226844787598, 0.6879597902297974, 0.782296895980835, 0.8766340017318726, 0.9709710478782654, 1.0653080940246582, 1.1596453189849854, 1.2539823055267334, 1.348319411277771, 1.4426565170288086, 1.5369936227798462, 1.6313307285308838, 1.7256677150726318, 1.820004940032959, 1.914341926574707, 2.008678913116455, 2.1030161380767822, 2.1973533630371094, 2.2916903495788574, 2.3860275745391846, 2.4803645610809326, 2.5747017860412598, 2.669038772583008, 2.763375759124756, 2.857712984085083, 2.952049970626831]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 7.0, 5.0, 9.0, 13.0, 23.0, 29.0, 33.0, 40.0, 72.0, 102.0, 132.0, 192.0, 309.0, 548.0, 1069.0, 2643.0, 8909.0, 47131.0, 394717.0, 513222.0, 62248.0, 11074.0, 3083.0, 1232.0, 633.0, 378.0, 189.0, 144.0, 98.0, 59.0, 55.0, 42.0, 34.0, 23.0, 9.0, 7.0, 11.0, 4.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302734375, -0.5137405395507812, -0.4972076416015625, -0.48067474365234375, -0.464141845703125, -0.44760894775390625, -0.4310760498046875, -0.41454315185546875, -0.39801025390625, -0.38147735595703125, -0.3649444580078125, -0.34841156005859375, -0.331878662109375, -0.31534576416015625, -0.2988128662109375, -0.28227996826171875, -0.2657470703125, -0.24921417236328125, -0.2326812744140625, -0.21614837646484375, -0.199615478515625, -0.18308258056640625, -0.1665496826171875, -0.15001678466796875, -0.13348388671875, -0.11695098876953125, -0.1004180908203125, -0.08388519287109375, -0.067352294921875, -0.05081939697265625, -0.0342864990234375, -0.01775360107421875, -0.001220703125, 0.01531219482421875, 0.0318450927734375, 0.04837799072265625, 0.064910888671875, 0.08144378662109375, 0.0979766845703125, 0.11450958251953125, 0.13104248046875, 0.14757537841796875, 0.1641082763671875, 0.18064117431640625, 0.197174072265625, 0.21370697021484375, 0.2302398681640625, 0.24677276611328125, 0.2633056640625, 0.27983856201171875, 0.2963714599609375, 0.31290435791015625, 0.329437255859375, 0.34597015380859375, 0.3625030517578125, 0.37903594970703125, 0.39556884765625, 0.41210174560546875, 0.4286346435546875, 0.44516754150390625, 0.461700439453125, 0.47823333740234375, 0.4947662353515625, 0.5112991333007812, 0.52783203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 12.0, 13.0, 24.0, 51.0, 80.0, 75.0, 120.0, 114.0, 138.0, 121.0, 98.0, 79.0, 34.0, 24.0, 13.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17172622680664062, -0.16559600830078125, -0.15946578979492188, -0.1533355712890625, -0.14720535278320312, -0.14107513427734375, -0.13494491577148438, -0.128814697265625, -0.12268447875976562, -0.11655426025390625, -0.11042404174804688, -0.1042938232421875, -0.09816360473632812, -0.09203338623046875, -0.08590316772460938, -0.07977294921875, -0.07364273071289062, -0.06751251220703125, -0.061382293701171875, -0.0552520751953125, -0.049121856689453125, -0.04299163818359375, -0.036861419677734375, -0.030731201171875, -0.024600982666015625, -0.01847076416015625, -0.012340545654296875, -0.0062103271484375, -8.0108642578125e-05, 0.00605010986328125, 0.012180328369140625, 0.018310546875, 0.024440765380859375, 0.03057098388671875, 0.036701202392578125, 0.0428314208984375, 0.048961639404296875, 0.05509185791015625, 0.061222076416015625, 0.067352294921875, 0.07348251342773438, 0.07961273193359375, 0.08574295043945312, 0.0918731689453125, 0.09800338745117188, 0.10413360595703125, 0.11026382446289062, 0.11639404296875, 0.12252426147460938, 0.12865447998046875, 0.13478469848632812, 0.1409149169921875, 0.14704513549804688, 0.15317535400390625, 0.15930557250976562, 0.165435791015625, 0.17156600952148438, 0.17769622802734375, 0.18382644653320312, 0.1899566650390625, 0.19608688354492188, 0.20221710205078125, 0.20834732055664062, 0.2144775390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 18.0, 12.0, 22.0, 30.0, 48.0, 64.0, 78.0, 124.0, 185.0, 337.0, 536.0, 995.0, 2011.0, 4528.0, 11690.0, 33327.0, 114192.0, 420331.0, 332558.0, 84531.0, 25815.0, 9425.0, 3823.0, 1651.0, 861.0, 477.0, 291.0, 179.0, 109.0, 90.0, 55.0, 30.0, 33.0, 16.0, 13.0, 14.0, 8.0, 10.0, 1.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2506828308105469, -0.24282073974609375, -0.23495864868164062, -0.2270965576171875, -0.21923446655273438, -0.21137237548828125, -0.20351028442382812, -0.195648193359375, -0.18778610229492188, -0.17992401123046875, -0.17206192016601562, -0.1641998291015625, -0.15633773803710938, -0.14847564697265625, -0.14061355590820312, -0.13275146484375, -0.12488937377929688, -0.11702728271484375, -0.10916519165039062, -0.1013031005859375, -0.09344100952148438, -0.08557891845703125, -0.07771682739257812, -0.069854736328125, -0.061992645263671875, -0.05413055419921875, -0.046268463134765625, -0.0384063720703125, -0.030544281005859375, -0.02268218994140625, -0.014820098876953125, -0.0069580078125, 0.000904083251953125, 0.00876617431640625, 0.016628265380859375, 0.0244903564453125, 0.032352447509765625, 0.04021453857421875, 0.048076629638671875, 0.055938720703125, 0.06380081176757812, 0.07166290283203125, 0.07952499389648438, 0.0873870849609375, 0.09524917602539062, 0.10311126708984375, 0.11097335815429688, 0.11883544921875, 0.12669754028320312, 0.13455963134765625, 0.14242172241210938, 0.1502838134765625, 0.15814590454101562, 0.16600799560546875, 0.17387008666992188, 0.181732177734375, 0.18959426879882812, 0.19745635986328125, 0.20531845092773438, 0.2131805419921875, 0.22104263305664062, 0.22890472412109375, 0.23676681518554688, 0.24462890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 6.0, 8.0, 6.0, 6.0, 15.0, 14.0, 17.0, 21.0, 15.0, 29.0, 32.0, 27.0, 41.0, 45.0, 43.0, 33.0, 61.0, 50.0, 44.0, 35.0, 55.0, 42.0, 42.0, 36.0, 30.0, 29.0, 28.0, 30.0, 24.0, 22.0, 17.0, 21.0, 20.0, 7.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.306396484375, -0.2976531982421875, -0.288909912109375, -0.2801666259765625, -0.27142333984375, -0.2626800537109375, -0.253936767578125, -0.2451934814453125, -0.2364501953125, -0.2277069091796875, -0.218963623046875, -0.2102203369140625, -0.20147705078125, -0.1927337646484375, -0.183990478515625, -0.1752471923828125, -0.16650390625, -0.1577606201171875, -0.149017333984375, -0.1402740478515625, -0.13153076171875, -0.1227874755859375, -0.114044189453125, -0.1053009033203125, -0.0965576171875, -0.0878143310546875, -0.079071044921875, -0.0703277587890625, -0.06158447265625, -0.0528411865234375, -0.044097900390625, -0.0353546142578125, -0.026611328125, -0.0178680419921875, -0.009124755859375, -0.0003814697265625, 0.00836181640625, 0.0171051025390625, 0.025848388671875, 0.0345916748046875, 0.0433349609375, 0.0520782470703125, 0.060821533203125, 0.0695648193359375, 0.07830810546875, 0.0870513916015625, 0.095794677734375, 0.1045379638671875, 0.11328125, 0.1220245361328125, 0.130767822265625, 0.1395111083984375, 0.14825439453125, 0.1569976806640625, 0.165740966796875, 0.1744842529296875, 0.1832275390625, 0.1919708251953125, 0.200714111328125, 0.2094573974609375, 0.21820068359375, 0.2269439697265625, 0.235687255859375, 0.2444305419921875, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 13.0, 20.0, 32.0, 81.0, 131.0, 327.0, 906.0, 3290.0, 23366.0, 405674.0, 572100.0, 36529.0, 4228.0, 1107.0, 398.0, 162.0, 79.0, 36.0, 19.0, 20.0, 6.0, 9.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.259521484375, -0.2537651062011719, -0.24800872802734375, -0.24225234985351562, -0.2364959716796875, -0.23073959350585938, -0.22498321533203125, -0.21922683715820312, -0.213470458984375, -0.20771408081054688, -0.20195770263671875, -0.19620132446289062, -0.1904449462890625, -0.18468856811523438, -0.17893218994140625, -0.17317581176757812, -0.16741943359375, -0.16166305541992188, -0.15590667724609375, -0.15015029907226562, -0.1443939208984375, -0.13863754272460938, -0.13288116455078125, -0.12712478637695312, -0.121368408203125, -0.11561203002929688, -0.10985565185546875, -0.10409927368164062, -0.0983428955078125, -0.09258651733398438, -0.08683013916015625, -0.08107376098632812, -0.0753173828125, -0.06956100463867188, -0.06380462646484375, -0.058048248291015625, -0.0522918701171875, -0.046535491943359375, -0.04077911376953125, -0.035022735595703125, -0.029266357421875, -0.023509979248046875, -0.01775360107421875, -0.011997222900390625, -0.0062408447265625, -0.000484466552734375, 0.00527191162109375, 0.011028289794921875, 0.01678466796875, 0.022541046142578125, 0.02829742431640625, 0.034053802490234375, 0.0398101806640625, 0.045566558837890625, 0.05132293701171875, 0.057079315185546875, 0.062835693359375, 0.06859207153320312, 0.07434844970703125, 0.08010482788085938, 0.0858612060546875, 0.09161758422851562, 0.09737396240234375, 0.10313034057617188, 0.10888671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 9.0, 15.0, 13.0, 18.0, 27.0, 36.0, 34.0, 49.0, 85.0, 93.0, 102.0, 101.0, 98.0, 81.0, 51.0, 57.0, 30.0, 36.0, 16.0, 13.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022554397583007812, -0.0002199411392211914, -0.0002143383026123047, -0.00020873546600341797, -0.00020313262939453125, -0.00019752979278564453, -0.0001919269561767578, -0.0001863241195678711, -0.00018072128295898438, -0.00017511844635009766, -0.00016951560974121094, -0.00016391277313232422, -0.0001583099365234375, -0.00015270709991455078, -0.00014710426330566406, -0.00014150142669677734, -0.00013589859008789062, -0.0001302957534790039, -0.0001246929168701172, -0.00011909008026123047, -0.00011348724365234375, -0.00010788440704345703, -0.00010228157043457031, -9.66787338256836e-05, -9.107589721679688e-05, -8.547306060791016e-05, -7.987022399902344e-05, -7.426738739013672e-05, -6.866455078125e-05, -6.306171417236328e-05, -5.745887756347656e-05, -5.1856040954589844e-05, -4.6253204345703125e-05, -4.0650367736816406e-05, -3.504753112792969e-05, -2.944469451904297e-05, -2.384185791015625e-05, -1.823902130126953e-05, -1.2636184692382812e-05, -7.033348083496094e-06, -1.430511474609375e-06, 4.172325134277344e-06, 9.775161743164062e-06, 1.537799835205078e-05, 2.09808349609375e-05, 2.658367156982422e-05, 3.218650817871094e-05, 3.7789344787597656e-05, 4.3392181396484375e-05, 4.8995018005371094e-05, 5.459785461425781e-05, 6.020069122314453e-05, 6.580352783203125e-05, 7.140636444091797e-05, 7.700920104980469e-05, 8.26120376586914e-05, 8.821487426757812e-05, 9.381771087646484e-05, 9.942054748535156e-05, 0.00010502338409423828, 0.000110626220703125, 0.00011622905731201172, 0.00012183189392089844, 0.00012743473052978516, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 9.0, 18.0, 36.0, 76.0, 157.0, 334.0, 831.0, 2467.0, 11892.0, 145975.0, 752602.0, 119803.0, 10574.0, 2339.0, 826.0, 290.0, 130.0, 73.0, 46.0, 17.0, 13.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19482421875, -0.1894817352294922, -0.18413925170898438, -0.17879676818847656, -0.17345428466796875, -0.16811180114746094, -0.16276931762695312, -0.1574268341064453, -0.1520843505859375, -0.1467418670654297, -0.14139938354492188, -0.13605690002441406, -0.13071441650390625, -0.12537193298339844, -0.12002944946289062, -0.11468696594238281, -0.109344482421875, -0.10400199890136719, -0.09865951538085938, -0.09331703186035156, -0.08797454833984375, -0.08263206481933594, -0.07728958129882812, -0.07194709777832031, -0.0666046142578125, -0.06126213073730469, -0.055919647216796875, -0.05057716369628906, -0.04523468017578125, -0.03989219665527344, -0.034549713134765625, -0.029207229614257812, -0.02386474609375, -0.018522262573242188, -0.013179779052734375, -0.007837295532226562, -0.00249481201171875, 0.0028476715087890625, 0.008190155029296875, 0.013532638549804688, 0.0188751220703125, 0.024217605590820312, 0.029560089111328125, 0.03490257263183594, 0.04024505615234375, 0.04558753967285156, 0.050930023193359375, 0.05627250671386719, 0.061614990234375, 0.06695747375488281, 0.07229995727539062, 0.07764244079589844, 0.08298492431640625, 0.08832740783691406, 0.09366989135742188, 0.09901237487792969, 0.1043548583984375, 0.10969734191894531, 0.11503982543945312, 0.12038230895996094, 0.12572479248046875, 0.13106727600097656, 0.13640975952148438, 0.1417522430419922, 0.1470947265625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 16.0, 23.0, 44.0, 48.0, 78.0, 94.0, 108.0, 137.0, 107.0, 78.0, 82.0, 57.0, 38.0, 18.0, 22.0, 12.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.1376953125, -0.1342153549194336, -0.1307353973388672, -0.12725543975830078, -0.12377548217773438, -0.12029552459716797, -0.11681556701660156, -0.11333560943603516, -0.10985565185546875, -0.10637569427490234, -0.10289573669433594, -0.09941577911376953, -0.09593582153320312, -0.09245586395263672, -0.08897590637207031, -0.0854959487915039, -0.0820159912109375, -0.0785360336303711, -0.07505607604980469, -0.07157611846923828, -0.06809616088867188, -0.06461620330810547, -0.06113624572753906, -0.057656288146972656, -0.05417633056640625, -0.050696372985839844, -0.04721641540527344, -0.04373645782470703, -0.040256500244140625, -0.03677654266357422, -0.03329658508300781, -0.029816627502441406, -0.026336669921875, -0.022856712341308594, -0.019376754760742188, -0.01589679718017578, -0.012416839599609375, -0.008936882019042969, -0.0054569244384765625, -0.0019769668579101562, 0.00150299072265625, 0.004982948303222656, 0.008462905883789062, 0.011942863464355469, 0.015422821044921875, 0.01890277862548828, 0.022382736206054688, 0.025862693786621094, 0.0293426513671875, 0.032822608947753906, 0.03630256652832031, 0.03978252410888672, 0.043262481689453125, 0.04674243927001953, 0.05022239685058594, 0.053702354431152344, 0.05718231201171875, 0.060662269592285156, 0.06414222717285156, 0.06762218475341797, 0.07110214233398438, 0.07458209991455078, 0.07806205749511719, 0.0815420150756836, 0.08502197265625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 18.0, 41.0, 96.0, 224.0, 334.0, 181.0, 59.0, 19.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9431120157241821, -1.8247101306915283, -1.7063082456588745, -1.5879063606262207, -1.469504475593567, -1.351102590560913, -1.2327005863189697, -1.1142988204956055, -0.9958968758583069, -0.8774949908256531, -0.7590931057929993, -0.6406911611557007, -0.5222892761230469, -0.40388739109039307, -0.28548550605773926, -0.16708362102508545, -0.04868173599243164, 0.06972015649080276, 0.18812204897403717, 0.3065239489078522, 0.424925833940506, 0.5433277487754822, 0.661729633808136, 0.7801315188407898, 0.8985334038734436, 1.0169353485107422, 1.135337233543396, 1.2537391185760498, 1.3721410036087036, 1.4905428886413574, 1.6089447736740112, 1.727346658706665, 1.8457486629486084, 1.9641505479812622, 2.082552433013916, 2.2009544372558594, 2.3193562030792236, 2.437758207321167, 2.5561599731445312, 2.6745619773864746, 2.792963743209839, 2.9113657474517822, 3.0297675132751465, 3.14816951751709, 3.266571283340454, 3.3849732875823975, 3.5033750534057617, 3.621777057647705, 3.7401790618896484, 3.858581066131592, 3.976982831954956, 4.09538459777832, 4.213786602020264, 4.332188606262207, 4.45059061050415, 4.5689921379089355, 4.687394142150879, 4.805796146392822, 4.924198150634766, 5.042599678039551, 5.161001682281494, 5.2794036865234375, 5.397805690765381, 5.516207218170166, 5.634609222412109]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 10.0, 11.0, 11.0, 17.0, 10.0, 24.0, 15.0, 26.0, 31.0, 31.0, 26.0, 38.0, 38.0, 42.0, 45.0, 62.0, 42.0, 42.0, 42.0, 50.0, 38.0, 29.0, 38.0, 30.0, 33.0, 23.0, 30.0, 23.0, 15.0, 16.0, 10.0, 17.0, 15.0, 11.0, 5.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.556401014328003, -1.510414481163025, -1.4644279479980469, -1.4184414148330688, -1.3724548816680908, -1.3264684677124023, -1.2804818153381348, -1.2344954013824463, -1.1885088682174683, -1.1425223350524902, -1.0965358018875122, -1.0505492687225342, -1.0045627355575562, -0.9585762619972229, -0.9125897288322449, -0.8666032552719116, -0.8206166625022888, -0.7746301293373108, -0.7286435961723328, -0.6826571226119995, -0.6366705894470215, -0.5906840562820435, -0.5446975231170654, -0.4987110197544098, -0.45272448658943176, -0.40673795342445374, -0.3607514500617981, -0.31476491689682007, -0.26877838373184204, -0.2227918803691864, -0.17680534720420837, -0.13081884384155273, -0.08483231067657471, -0.038845788687467575, 0.007140733301639557, 0.05312725901603699, 0.09911377727985382, 0.14510029554367065, 0.19108682870864868, 0.23707333207130432, 0.28305986523628235, 0.3290463984012604, 0.375032901763916, 0.42101943492889404, 0.46700596809387207, 0.5129925012588501, 0.5589790344238281, 0.6049655079841614, 0.6509520411491394, 0.6969385743141174, 0.7429251074790955, 0.7889115810394287, 0.8348981142044067, 0.8808846473693848, 0.9268711805343628, 0.9728577136993408, 1.0188442468643188, 1.0648307800292969, 1.110817313194275, 1.156803846359253, 1.202790379524231, 1.248776912689209, 1.2947633266448975, 1.3407498598098755, 1.3867363929748535]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 18.0, 34.0, 57.0, 125.0, 335.0, 1072.0, 8690.0, 4060158.0, 119018.0, 3427.0, 786.0, 272.0, 130.0, 67.0, 40.0, 16.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.3639678955078125, -1.308990478515625, -1.2540130615234375, -1.19903564453125, -1.1440582275390625, -1.089080810546875, -1.0341033935546875, -0.9791259765625, -0.9241485595703125, -0.869171142578125, -0.8141937255859375, -0.75921630859375, -0.7042388916015625, -0.649261474609375, -0.5942840576171875, -0.539306640625, -0.4843292236328125, -0.429351806640625, -0.3743743896484375, -0.31939697265625, -0.2644195556640625, -0.209442138671875, -0.1544647216796875, -0.0994873046875, -0.0445098876953125, 0.010467529296875, 0.0654449462890625, 0.12042236328125, 0.1753997802734375, 0.230377197265625, 0.2853546142578125, 0.34033203125, 0.3953094482421875, 0.450286865234375, 0.5052642822265625, 0.56024169921875, 0.6152191162109375, 0.670196533203125, 0.7251739501953125, 0.7801513671875, 0.8351287841796875, 0.890106201171875, 0.9450836181640625, 1.00006103515625, 1.0550384521484375, 1.110015869140625, 1.1649932861328125, 1.219970703125, 1.2749481201171875, 1.329925537109375, 1.3849029541015625, 1.43988037109375, 1.4948577880859375, 1.549835205078125, 1.6048126220703125, 1.6597900390625, 1.7147674560546875, 1.769744873046875, 1.8247222900390625, 1.87969970703125, 1.9346771240234375, 1.989654541015625, 2.0446319580078125, 2.099609375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 18.0, 16.0, 35.0, 51.0, 76.0, 97.0, 111.0, 124.0, 107.0, 118.0, 92.0, 56.0, 42.0, 32.0, 13.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.17180252075195312, -0.16562652587890625, -0.15945053100585938, -0.1532745361328125, -0.14709854125976562, -0.14092254638671875, -0.13474655151367188, -0.128570556640625, -0.12239456176757812, -0.11621856689453125, -0.11004257202148438, -0.1038665771484375, -0.09769058227539062, -0.09151458740234375, -0.08533859252929688, -0.07916259765625, -0.07298660278320312, -0.06681060791015625, -0.060634613037109375, -0.0544586181640625, -0.048282623291015625, -0.04210662841796875, -0.035930633544921875, -0.029754638671875, -0.023578643798828125, -0.01740264892578125, -0.011226654052734375, -0.0050506591796875, 0.001125335693359375, 0.00730133056640625, 0.013477325439453125, 0.0196533203125, 0.025829315185546875, 0.03200531005859375, 0.038181304931640625, 0.0443572998046875, 0.050533294677734375, 0.05670928955078125, 0.06288528442382812, 0.069061279296875, 0.07523727416992188, 0.08141326904296875, 0.08758926391601562, 0.0937652587890625, 0.09994125366210938, 0.10611724853515625, 0.11229324340820312, 0.11846923828125, 0.12464523315429688, 0.13082122802734375, 0.13699722290039062, 0.1431732177734375, 0.14934921264648438, 0.15552520751953125, 0.16170120239257812, 0.167877197265625, 0.17405319213867188, 0.18022918701171875, 0.18640518188476562, 0.1925811767578125, 0.19875717163085938, 0.20493316650390625, 0.21110916137695312, 0.21728515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 10.0, 27.0, 50.0, 81.0, 135.0, 261.0, 468.0, 999.0, 2248.0, 6915.0, 56262.0, 3847918.0, 259021.0, 14336.0, 3141.0, 1184.0, 549.0, 287.0, 148.0, 104.0, 55.0, 24.0, 21.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.509124755859375, -0.49139404296875, -0.473663330078125, -0.4559326171875, -0.438201904296875, -0.42047119140625, -0.402740478515625, -0.385009765625, -0.367279052734375, -0.34954833984375, -0.331817626953125, -0.3140869140625, -0.296356201171875, -0.27862548828125, -0.260894775390625, -0.2431640625, -0.225433349609375, -0.20770263671875, -0.189971923828125, -0.1722412109375, -0.154510498046875, -0.13677978515625, -0.119049072265625, -0.101318359375, -0.083587646484375, -0.06585693359375, -0.048126220703125, -0.0303955078125, -0.012664794921875, 0.00506591796875, 0.022796630859375, 0.04052734375, 0.058258056640625, 0.07598876953125, 0.093719482421875, 0.1114501953125, 0.129180908203125, 0.14691162109375, 0.164642333984375, 0.182373046875, 0.200103759765625, 0.21783447265625, 0.235565185546875, 0.2532958984375, 0.271026611328125, 0.28875732421875, 0.306488037109375, 0.32421875, 0.341949462890625, 0.35968017578125, 0.377410888671875, 0.3951416015625, 0.412872314453125, 0.43060302734375, 0.448333740234375, 0.466064453125, 0.483795166015625, 0.50152587890625, 0.519256591796875, 0.5369873046875, 0.554718017578125, 0.57244873046875, 0.590179443359375, 0.60791015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 4.0, 7.0, 6.0, 11.0, 19.0, 14.0, 55.0, 105.0, 340.0, 2152.0, 944.0, 228.0, 93.0, 42.0, 20.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.22510910034179688, -0.21755218505859375, -0.20999526977539062, -0.2024383544921875, -0.19488143920898438, -0.18732452392578125, -0.17976760864257812, -0.172210693359375, -0.16465377807617188, -0.15709686279296875, -0.14953994750976562, -0.1419830322265625, -0.13442611694335938, -0.12686920166015625, -0.11931228637695312, -0.11175537109375, -0.10419845581054688, -0.09664154052734375, -0.08908462524414062, -0.0815277099609375, -0.07397079467773438, -0.06641387939453125, -0.058856964111328125, -0.051300048828125, -0.043743133544921875, -0.03618621826171875, -0.028629302978515625, -0.0210723876953125, -0.013515472412109375, -0.00595855712890625, 0.001598358154296875, 0.0091552734375, 0.016712188720703125, 0.02426910400390625, 0.031826019287109375, 0.0393829345703125, 0.046939849853515625, 0.05449676513671875, 0.062053680419921875, 0.069610595703125, 0.07716751098632812, 0.08472442626953125, 0.09228134155273438, 0.0998382568359375, 0.10739517211914062, 0.11495208740234375, 0.12250900268554688, 0.13006591796875, 0.13762283325195312, 0.14517974853515625, 0.15273666381835938, 0.1602935791015625, 0.16785049438476562, 0.17540740966796875, 0.18296432495117188, 0.190521240234375, 0.19807815551757812, 0.20563507080078125, 0.21319198608398438, 0.2207489013671875, 0.22830581665039062, 0.23586273193359375, 0.24341964721679688, 0.2509765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 23.0, 72.0, 290.0, 405.0, 138.0, 43.0, 16.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.630551338195801, -3.556957960128784, -3.4833643436431885, -3.409770965576172, -3.336177349090576, -3.2625839710235596, -3.188990354537964, -3.1153969764709473, -3.0418033599853516, -2.968209981918335, -2.8946163654327393, -2.8210229873657227, -2.747429370880127, -2.6738359928131104, -2.6002423763275146, -2.526648998260498, -2.4530556201934814, -2.379462242126465, -2.305868625640869, -2.2322752475738525, -2.158681631088257, -2.0850882530212402, -2.0114946365356445, -1.937901258468628, -1.8643077611923218, -1.7907142639160156, -1.7171207666397095, -1.6435272693634033, -1.5699338912963867, -1.496340274810791, -1.4227468967437744, -1.3491533994674683, -1.275559902191162, -1.201966404914856, -1.1283729076385498, -1.0547794103622437, -0.9811859726905823, -0.9075924754142761, -0.8339990377426147, -0.7604055404663086, -0.6868120431900024, -0.6132185459136963, -0.5396250486373901, -0.46603161096572876, -0.3924381136894226, -0.31884461641311646, -0.2452511489391327, -0.17165768146514893, -0.09806418418884277, -0.024470701813697815, 0.049122780561447144, 0.1227162629365921, 0.19630974531173706, 0.2699032425880432, 0.343496710062027, 0.41709017753601074, 0.4906836748123169, 0.564277172088623, 0.6378706693649292, 0.7114641070365906, 0.7850576043128967, 0.8586511015892029, 0.9322445392608643, 1.0058380365371704, 1.0794315338134766]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 15.0, 13.0, 17.0, 31.0, 31.0, 45.0, 49.0, 79.0, 85.0, 62.0, 65.0, 66.0, 67.0, 76.0, 54.0, 48.0, 66.0, 29.0, 28.0, 17.0, 15.0, 13.0, 10.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9534122943878174, -0.9284040331840515, -0.9033958315849304, -0.8783875703811646, -0.8533793091773987, -0.8283711075782776, -0.8033628463745117, -0.7783546447753906, -0.7533463835716248, -0.7283381223678589, -0.7033299207687378, -0.6783216595649719, -0.653313398361206, -0.628305196762085, -0.6032969355583191, -0.5782886743545532, -0.5532804727554321, -0.5282722115516663, -0.5032640099525452, -0.4782557487487793, -0.4532475173473358, -0.42823928594589233, -0.40323102474212646, -0.378222793340683, -0.3532145023345947, -0.32820627093315125, -0.3031980097293854, -0.2781897783279419, -0.2531815469264984, -0.22817330062389374, -0.20316505432128906, -0.17815682291984558, -0.1531485915184021, -0.12814034521579742, -0.10313211381435394, -0.07812386751174927, -0.05311562865972519, -0.02810738980770111, -0.0030991435050964355, 0.021909087896347046, 0.04691733419895172, 0.0719255730509758, 0.09693381190299988, 0.12194205820560455, 0.14695030450820923, 0.1719585359096527, 0.19696678221225739, 0.22197501361370087, 0.24698325991630554, 0.271991491317749, 0.2969997525215149, 0.3220079839229584, 0.34701621532440186, 0.3720244765281677, 0.3970327079296112, 0.4220409393310547, 0.44704920053482056, 0.47205743193626404, 0.4970656931400299, 0.5220739245414734, 0.5470821857452393, 0.5720903873443604, 0.5970986485481262, 0.6221069097518921, 0.6471151113510132]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 7.0, 8.0, 17.0, 18.0, 33.0, 63.0, 105.0, 168.0, 423.0, 912.0, 2801.0, 13719.0, 295931.0, 703448.0, 24882.0, 3812.0, 1173.0, 498.0, 215.0, 141.0, 57.0, 39.0, 33.0, 11.0, 7.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.869140625, -0.8402938842773438, -0.8114471435546875, -0.7826004028320312, -0.753753662109375, -0.7249069213867188, -0.6960601806640625, -0.6672134399414062, -0.63836669921875, -0.6095199584960938, -0.5806732177734375, -0.5518264770507812, -0.522979736328125, -0.49413299560546875, -0.4652862548828125, -0.43643951416015625, -0.4075927734375, -0.37874603271484375, -0.3498992919921875, -0.32105255126953125, -0.292205810546875, -0.26335906982421875, -0.2345123291015625, -0.20566558837890625, -0.17681884765625, -0.14797210693359375, -0.1191253662109375, -0.09027862548828125, -0.061431884765625, -0.03258514404296875, -0.0037384033203125, 0.02510833740234375, 0.053955078125, 0.08280181884765625, 0.1116485595703125, 0.14049530029296875, 0.169342041015625, 0.19818878173828125, 0.2270355224609375, 0.25588226318359375, 0.28472900390625, 0.31357574462890625, 0.3424224853515625, 0.37126922607421875, 0.400115966796875, 0.42896270751953125, 0.4578094482421875, 0.48665618896484375, 0.5155029296875, 0.5443496704101562, 0.5731964111328125, 0.6020431518554688, 0.630889892578125, 0.6597366333007812, 0.6885833740234375, 0.7174301147460938, 0.74627685546875, 0.7751235961914062, 0.8039703369140625, 0.8328170776367188, 0.861663818359375, 0.8905105590820312, 0.9193572998046875, 0.9482040405273438, 0.97705078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 11.0, 12.0, 14.0, 32.0, 47.0, 70.0, 87.0, 99.0, 94.0, 116.0, 110.0, 99.0, 70.0, 52.0, 36.0, 29.0, 9.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1767578125, -0.1710987091064453, -0.16543960571289062, -0.15978050231933594, -0.15412139892578125, -0.14846229553222656, -0.14280319213867188, -0.1371440887451172, -0.1314849853515625, -0.1258258819580078, -0.12016677856445312, -0.11450767517089844, -0.10884857177734375, -0.10318946838378906, -0.09753036499023438, -0.09187126159667969, -0.086212158203125, -0.08055305480957031, -0.07489395141601562, -0.06923484802246094, -0.06357574462890625, -0.05791664123535156, -0.052257537841796875, -0.04659843444824219, -0.0409393310546875, -0.03528022766113281, -0.029621124267578125, -0.023962020874023438, -0.01830291748046875, -0.012643814086914062, -0.006984710693359375, -0.0013256072998046875, 0.00433349609375, 0.009992599487304688, 0.015651702880859375, 0.021310806274414062, 0.02696990966796875, 0.03262901306152344, 0.038288116455078125, 0.04394721984863281, 0.0496063232421875, 0.05526542663574219, 0.060924530029296875, 0.06658363342285156, 0.07224273681640625, 0.07790184020996094, 0.08356094360351562, 0.08922004699707031, 0.094879150390625, 0.10053825378417969, 0.10619735717773438, 0.11185646057128906, 0.11751556396484375, 0.12317466735839844, 0.12883377075195312, 0.1344928741455078, 0.1401519775390625, 0.1458110809326172, 0.15147018432617188, 0.15712928771972656, 0.16278839111328125, 0.16844749450683594, 0.17410659790039062, 0.1797657012939453, 0.1854248046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 5.0, 12.0, 2.0, 15.0, 15.0, 18.0, 28.0, 45.0, 67.0, 108.0, 156.0, 293.0, 646.0, 1677.0, 5105.0, 20999.0, 158455.0, 730310.0, 107785.0, 16109.0, 4136.0, 1306.0, 525.0, 285.0, 165.0, 93.0, 53.0, 39.0, 23.0, 14.0, 9.0, 8.0, 11.0, 4.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486572265625, -0.4728355407714844, -0.45909881591796875, -0.4453620910644531, -0.4316253662109375, -0.4178886413574219, -0.40415191650390625, -0.3904151916503906, -0.376678466796875, -0.3629417419433594, -0.34920501708984375, -0.3354682922363281, -0.3217315673828125, -0.3079948425292969, -0.29425811767578125, -0.2805213928222656, -0.26678466796875, -0.2530479431152344, -0.23931121826171875, -0.22557449340820312, -0.2118377685546875, -0.19810104370117188, -0.18436431884765625, -0.17062759399414062, -0.156890869140625, -0.14315414428710938, -0.12941741943359375, -0.11568069458007812, -0.1019439697265625, -0.08820724487304688, -0.07447052001953125, -0.060733795166015625, -0.0469970703125, -0.033260345458984375, -0.01952362060546875, -0.005786895751953125, 0.0079498291015625, 0.021686553955078125, 0.03542327880859375, 0.049160003662109375, 0.062896728515625, 0.07663345336914062, 0.09037017822265625, 0.10410690307617188, 0.1178436279296875, 0.13158035278320312, 0.14531707763671875, 0.15905380249023438, 0.17279052734375, 0.18652725219726562, 0.20026397705078125, 0.21400070190429688, 0.2277374267578125, 0.24147415161132812, 0.25521087646484375, 0.2689476013183594, 0.282684326171875, 0.2964210510253906, 0.31015777587890625, 0.3238945007324219, 0.3376312255859375, 0.3513679504394531, 0.36510467529296875, 0.3788414001464844, 0.392578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 11.0, 4.0, 10.0, 15.0, 13.0, 6.0, 25.0, 19.0, 19.0, 37.0, 44.0, 36.0, 46.0, 43.0, 46.0, 59.0, 43.0, 58.0, 45.0, 49.0, 39.0, 50.0, 40.0, 40.0, 24.0, 23.0, 28.0, 19.0, 23.0, 18.0, 8.0, 8.0, 7.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.32275390625, -0.31243896484375, -0.3021240234375, -0.29180908203125, -0.281494140625, -0.27117919921875, -0.2608642578125, -0.25054931640625, -0.240234375, -0.22991943359375, -0.2196044921875, -0.20928955078125, -0.198974609375, -0.18865966796875, -0.1783447265625, -0.16802978515625, -0.15771484375, -0.14739990234375, -0.1370849609375, -0.12677001953125, -0.116455078125, -0.10614013671875, -0.0958251953125, -0.08551025390625, -0.0751953125, -0.06488037109375, -0.0545654296875, -0.04425048828125, -0.033935546875, -0.02362060546875, -0.0133056640625, -0.00299072265625, 0.00732421875, 0.01763916015625, 0.0279541015625, 0.03826904296875, 0.048583984375, 0.05889892578125, 0.0692138671875, 0.07952880859375, 0.08984375, 0.10015869140625, 0.1104736328125, 0.12078857421875, 0.131103515625, 0.14141845703125, 0.1517333984375, 0.16204833984375, 0.17236328125, 0.18267822265625, 0.1929931640625, 0.20330810546875, 0.213623046875, 0.22393798828125, 0.2342529296875, 0.24456787109375, 0.2548828125, 0.26519775390625, 0.2755126953125, 0.28582763671875, 0.296142578125, 0.30645751953125, 0.3167724609375, 0.32708740234375, 0.33740234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 12.0, 20.0, 62.0, 210.0, 947.0, 21864.0, 1017566.0, 7075.0, 559.0, 146.0, 48.0, 17.0, 11.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6359786987304688, -0.6157073974609375, -0.5954360961914062, -0.575164794921875, -0.5548934936523438, -0.5346221923828125, -0.5143508911132812, -0.49407958984375, -0.47380828857421875, -0.4535369873046875, -0.43326568603515625, -0.412994384765625, -0.39272308349609375, -0.3724517822265625, -0.35218048095703125, -0.3319091796875, -0.31163787841796875, -0.2913665771484375, -0.27109527587890625, -0.250823974609375, -0.23055267333984375, -0.2102813720703125, -0.19001007080078125, -0.16973876953125, -0.14946746826171875, -0.1291961669921875, -0.10892486572265625, -0.088653564453125, -0.06838226318359375, -0.0481109619140625, -0.02783966064453125, -0.007568359375, 0.01270294189453125, 0.0329742431640625, 0.05324554443359375, 0.073516845703125, 0.09378814697265625, 0.1140594482421875, 0.13433074951171875, 0.15460205078125, 0.17487335205078125, 0.1951446533203125, 0.21541595458984375, 0.235687255859375, 0.25595855712890625, 0.2762298583984375, 0.29650115966796875, 0.3167724609375, 0.33704376220703125, 0.3573150634765625, 0.37758636474609375, 0.397857666015625, 0.41812896728515625, 0.4384002685546875, 0.45867156982421875, 0.47894287109375, 0.49921417236328125, 0.5194854736328125, 0.5397567749023438, 0.560028076171875, 0.5802993774414062, 0.6005706787109375, 0.6208419799804688, 0.64111328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 15.0, 46.0, 110.0, 212.0, 309.0, 171.0, 85.0, 30.0, 14.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007323622703552246, -0.0007089376449584961, -0.0006855130195617676, -0.0006620883941650391, -0.0006386637687683105, -0.000615239143371582, -0.0005918145179748535, -0.000568389892578125, -0.0005449652671813965, -0.000521540641784668, -0.0004981160163879395, -0.00047469139099121094, -0.0004512667655944824, -0.0004278421401977539, -0.0004044175148010254, -0.0003809928894042969, -0.00035756826400756836, -0.00033414363861083984, -0.00031071901321411133, -0.0002872943878173828, -0.0002638697624206543, -0.00024044513702392578, -0.00021702051162719727, -0.00019359588623046875, -0.00017017126083374023, -0.00014674663543701172, -0.0001233220100402832, -9.989738464355469e-05, -7.647275924682617e-05, -5.3048133850097656e-05, -2.962350845336914e-05, -6.198883056640625e-06, 1.722574234008789e-05, 4.0650367736816406e-05, 6.407499313354492e-05, 8.749961853027344e-05, 0.00011092424392700195, 0.00013434886932373047, 0.00015777349472045898, 0.0001811981201171875, 0.00020462274551391602, 0.00022804737091064453, 0.00025147199630737305, 0.00027489662170410156, 0.0002983212471008301, 0.0003217458724975586, 0.0003451704978942871, 0.0003685951232910156, 0.00039201974868774414, 0.00041544437408447266, 0.00043886899948120117, 0.0004622936248779297, 0.0004857182502746582, 0.0005091428756713867, 0.0005325675010681152, 0.0005559921264648438, 0.0005794167518615723, 0.0006028413772583008, 0.0006262660026550293, 0.0006496906280517578, 0.0006731152534484863, 0.0006965398788452148, 0.0007199645042419434, 0.0007433891296386719]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 12.0, 16.0, 35.0, 57.0, 103.0, 138.0, 297.0, 973.0, 24873.0, 1012579.0, 8239.0, 651.0, 244.0, 146.0, 78.0, 51.0, 25.0, 10.0, 8.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65576171875, -0.6377372741699219, -0.6197128295898438, -0.6016883850097656, -0.5836639404296875, -0.5656394958496094, -0.5476150512695312, -0.5295906066894531, -0.511566162109375, -0.4935417175292969, -0.47551727294921875, -0.4574928283691406, -0.4394683837890625, -0.4214439392089844, -0.40341949462890625, -0.3853950500488281, -0.36737060546875, -0.3493461608886719, -0.33132171630859375, -0.3132972717285156, -0.2952728271484375, -0.2772483825683594, -0.25922393798828125, -0.24119949340820312, -0.223175048828125, -0.20515060424804688, -0.18712615966796875, -0.16910171508789062, -0.1510772705078125, -0.13305282592773438, -0.11502838134765625, -0.09700393676757812, -0.0789794921875, -0.060955047607421875, -0.04293060302734375, -0.024906158447265625, -0.0068817138671875, 0.011142730712890625, 0.02916717529296875, 0.047191619873046875, 0.065216064453125, 0.08324050903320312, 0.10126495361328125, 0.11928939819335938, 0.1373138427734375, 0.15533828735351562, 0.17336273193359375, 0.19138717651367188, 0.20941162109375, 0.22743606567382812, 0.24546051025390625, 0.2634849548339844, 0.2815093994140625, 0.2995338439941406, 0.31755828857421875, 0.3355827331542969, 0.353607177734375, 0.3716316223144531, 0.38965606689453125, 0.4076805114746094, 0.4257049560546875, 0.4437294006347656, 0.46175384521484375, 0.4797782897949219, 0.497802734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 14.0, 24.0, 135.0, 455.0, 301.0, 57.0, 14.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5134124755859375, -0.495574951171875, -0.4777374267578125, -0.45989990234375, -0.4420623779296875, -0.424224853515625, -0.4063873291015625, -0.3885498046875, -0.3707122802734375, -0.352874755859375, -0.3350372314453125, -0.31719970703125, -0.2993621826171875, -0.281524658203125, -0.2636871337890625, -0.245849609375, -0.2280120849609375, -0.210174560546875, -0.1923370361328125, -0.17449951171875, -0.1566619873046875, -0.138824462890625, -0.1209869384765625, -0.1031494140625, -0.0853118896484375, -0.067474365234375, -0.0496368408203125, -0.03179931640625, -0.0139617919921875, 0.003875732421875, 0.0217132568359375, 0.03955078125, 0.0573883056640625, 0.075225830078125, 0.0930633544921875, 0.11090087890625, 0.1287384033203125, 0.146575927734375, 0.1644134521484375, 0.1822509765625, 0.2000885009765625, 0.217926025390625, 0.2357635498046875, 0.25360107421875, 0.2714385986328125, 0.289276123046875, 0.3071136474609375, 0.324951171875, 0.3427886962890625, 0.360626220703125, 0.3784637451171875, 0.39630126953125, 0.4141387939453125, 0.431976318359375, 0.4498138427734375, 0.4676513671875, 0.4854888916015625, 0.503326416015625, 0.5211639404296875, 0.53900146484375, 0.5568389892578125, 0.574676513671875, 0.5925140380859375, 0.6103515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 16.0, 46.0, 121.0, 320.0, 338.0, 117.0, 28.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.74886417388916, -4.591914176940918, -4.434964656829834, -4.278014659881592, -4.121065139770508, -3.9641153812408447, -3.8071656227111816, -3.6502156257629395, -3.4932661056518555, -3.3363163471221924, -3.1793665885925293, -3.022416830062866, -2.865467071533203, -2.70851731300354, -2.551567554473877, -2.3946175575256348, -2.2376677989959717, -2.0807180404663086, -1.9237682819366455, -1.7668185234069824, -1.6098687648773193, -1.4529190063476562, -1.2959691286087036, -1.1390193700790405, -0.9820696115493774, -0.8251198530197144, -0.6681700944900513, -0.5112202763557434, -0.3542705178260803, -0.19732075929641724, -0.040370941162109375, 0.11657881736755371, 0.2735285758972168, 0.4304783344268799, 0.587428092956543, 0.7443779110908508, 0.9013276696205139, 1.0582773685455322, 1.2152272462844849, 1.372177004814148, 1.529126763343811, 1.6860765218734741, 1.8430262804031372, 1.9999761581420898, 2.156925916671753, 2.313875675201416, 2.470825433731079, 2.627775192260742, 2.7847249507904053, 2.9416747093200684, 3.0986244678497314, 3.2555742263793945, 3.4125239849090576, 3.5694737434387207, 3.726423740386963, 3.883373260498047, 4.040323257446289, 4.197273254394531, 4.354222774505615, 4.511172771453857, 4.668122291564941, 4.825072288513184, 4.982021808624268, 5.13897180557251, 5.295921325683594]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 8.0, 6.0, 7.0, 7.0, 11.0, 11.0, 18.0, 25.0, 14.0, 27.0, 31.0, 31.0, 31.0, 38.0, 40.0, 47.0, 49.0, 48.0, 40.0, 42.0, 35.0, 48.0, 47.0, 32.0, 40.0, 39.0, 32.0, 34.0, 24.0, 15.0, 15.0, 11.0, 11.0, 14.0, 12.0, 9.0, 4.0, 5.0, 5.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.5518990755081177, -1.5057920217514038, -1.4596848487854004, -1.4135777950286865, -1.367470622062683, -1.3213635683059692, -1.2752563953399658, -1.229149341583252, -1.183042287826538, -1.1369352340698242, -1.0908280611038208, -1.044721007347107, -0.9986138343811035, -0.9525067806243896, -0.906399667263031, -0.8602925539016724, -0.814185380935669, -0.7680782675743103, -0.7219711542129517, -0.6758641004562378, -0.6297569274902344, -0.5836498737335205, -0.5375427603721619, -0.4914356470108032, -0.4453285336494446, -0.39922142028808594, -0.3531143069267273, -0.30700722336769104, -0.2609001100063324, -0.21479299664497375, -0.1686859130859375, -0.12257879972457886, -0.07647180557250977, -0.03036469966173172, 0.015742406249046326, 0.061849504709243774, 0.10795661807060242, 0.15406373143196106, 0.20017081499099731, 0.24627792835235596, 0.2923850417137146, 0.33849215507507324, 0.3845992684364319, 0.43070635199546814, 0.4768134653568268, 0.5229206085205078, 0.5690276622772217, 0.6151347756385803, 0.661241888999939, 0.7073490023612976, 0.7534561157226562, 0.7995631694793701, 0.8456703424453735, 0.8917773962020874, 0.937884509563446, 0.9839916229248047, 1.0300986766815186, 1.0762057304382324, 1.1223129034042358, 1.1684199571609497, 1.2145271301269531, 1.260634183883667, 1.3067412376403809, 1.3528484106063843, 1.3989555835723877]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 18.0, 12.0, 29.0, 41.0, 71.0, 175.0, 337.0, 902.0, 3066.0, 23734.0, 4068376.0, 89445.0, 5676.0, 1284.0, 541.0, 243.0, 137.0, 84.0, 40.0, 24.0, 12.0, 15.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0736007690429688, -1.0417327880859375, -1.0098648071289062, -0.977996826171875, -0.9461288452148438, -0.9142608642578125, -0.8823928833007812, -0.85052490234375, -0.8186569213867188, -0.7867889404296875, -0.7549209594726562, -0.723052978515625, -0.6911849975585938, -0.6593170166015625, -0.6274490356445312, -0.5955810546875, -0.5637130737304688, -0.5318450927734375, -0.49997711181640625, -0.468109130859375, -0.43624114990234375, -0.4043731689453125, -0.37250518798828125, -0.34063720703125, -0.30876922607421875, -0.2769012451171875, -0.24503326416015625, -0.213165283203125, -0.18129730224609375, -0.1494293212890625, -0.11756134033203125, -0.085693359375, -0.05382537841796875, -0.0219573974609375, 0.00991058349609375, 0.041778564453125, 0.07364654541015625, 0.1055145263671875, 0.13738250732421875, 0.16925048828125, 0.20111846923828125, 0.2329864501953125, 0.26485443115234375, 0.296722412109375, 0.32859039306640625, 0.3604583740234375, 0.39232635498046875, 0.4241943359375, 0.45606231689453125, 0.4879302978515625, 0.5197982788085938, 0.551666259765625, 0.5835342407226562, 0.6154022216796875, 0.6472702026367188, 0.67913818359375, 0.7110061645507812, 0.7428741455078125, 0.7747421264648438, 0.806610107421875, 0.8384780883789062, 0.8703460693359375, 0.9022140502929688, 0.93408203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 17.0, 23.0, 34.0, 62.0, 74.0, 87.0, 99.0, 106.0, 95.0, 94.0, 90.0, 68.0, 54.0, 36.0, 22.0, 11.0, 11.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.171630859375, -0.1658935546875, -0.16015625, -0.1544189453125, -0.148681640625, -0.1429443359375, -0.13720703125, -0.1314697265625, -0.125732421875, -0.1199951171875, -0.1142578125, -0.1085205078125, -0.102783203125, -0.0970458984375, -0.09130859375, -0.0855712890625, -0.079833984375, -0.0740966796875, -0.068359375, -0.0626220703125, -0.056884765625, -0.0511474609375, -0.04541015625, -0.0396728515625, -0.033935546875, -0.0281982421875, -0.0224609375, -0.0167236328125, -0.010986328125, -0.0052490234375, 0.00048828125, 0.0062255859375, 0.011962890625, 0.0177001953125, 0.0234375, 0.0291748046875, 0.034912109375, 0.0406494140625, 0.04638671875, 0.0521240234375, 0.057861328125, 0.0635986328125, 0.0693359375, 0.0750732421875, 0.080810546875, 0.0865478515625, 0.09228515625, 0.0980224609375, 0.103759765625, 0.1094970703125, 0.115234375, 0.1209716796875, 0.126708984375, 0.1324462890625, 0.13818359375, 0.1439208984375, 0.149658203125, 0.1553955078125, 0.1611328125, 0.1668701171875, 0.172607421875, 0.1783447265625, 0.18408203125, 0.1898193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 17.0, 19.0, 32.0, 50.0, 87.0, 134.0, 239.0, 530.0, 1250.0, 4948.0, 54928.0, 4090656.0, 35265.0, 4023.0, 1100.0, 439.0, 237.0, 143.0, 65.0, 43.0, 26.0, 14.0, 18.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8916015625, -0.8623123168945312, -0.8330230712890625, -0.8037338256835938, -0.774444580078125, -0.7451553344726562, -0.7158660888671875, -0.6865768432617188, -0.65728759765625, -0.6279983520507812, -0.5987091064453125, -0.5694198608398438, -0.540130615234375, -0.5108413696289062, -0.4815521240234375, -0.45226287841796875, -0.4229736328125, -0.39368438720703125, -0.3643951416015625, -0.33510589599609375, -0.305816650390625, -0.27652740478515625, -0.2472381591796875, -0.21794891357421875, -0.18865966796875, -0.15937042236328125, -0.1300811767578125, -0.10079193115234375, -0.071502685546875, -0.04221343994140625, -0.0129241943359375, 0.01636505126953125, 0.045654296875, 0.07494354248046875, 0.1042327880859375, 0.13352203369140625, 0.162811279296875, 0.19210052490234375, 0.2213897705078125, 0.25067901611328125, 0.27996826171875, 0.30925750732421875, 0.3385467529296875, 0.36783599853515625, 0.397125244140625, 0.42641448974609375, 0.4557037353515625, 0.48499298095703125, 0.5142822265625, 0.5435714721679688, 0.5728607177734375, 0.6021499633789062, 0.631439208984375, 0.6607284545898438, 0.6900177001953125, 0.7193069458007812, 0.74859619140625, 0.7778854370117188, 0.8071746826171875, 0.8364639282226562, 0.865753173828125, 0.8950424194335938, 0.9243316650390625, 0.9536209106445312, 0.98291015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 10.0, 9.0, 10.0, 22.0, 49.0, 168.0, 1484.0, 2027.0, 182.0, 62.0, 22.0, 11.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30224609375, -0.2930946350097656, -0.28394317626953125, -0.2747917175292969, -0.2656402587890625, -0.2564888000488281, -0.24733734130859375, -0.23818588256835938, -0.229034423828125, -0.21988296508789062, -0.21073150634765625, -0.20158004760742188, -0.1924285888671875, -0.18327713012695312, -0.17412567138671875, -0.16497421264648438, -0.15582275390625, -0.14667129516601562, -0.13751983642578125, -0.12836837768554688, -0.1192169189453125, -0.11006546020507812, -0.10091400146484375, -0.09176254272460938, -0.082611083984375, -0.07345962524414062, -0.06430816650390625, -0.055156707763671875, -0.0460052490234375, -0.036853790283203125, -0.02770233154296875, -0.018550872802734375, -0.0093994140625, -0.000247955322265625, 0.00890350341796875, 0.018054962158203125, 0.0272064208984375, 0.036357879638671875, 0.04550933837890625, 0.054660797119140625, 0.063812255859375, 0.07296371459960938, 0.08211517333984375, 0.09126663208007812, 0.1004180908203125, 0.10956954956054688, 0.11872100830078125, 0.12787246704101562, 0.13702392578125, 0.14617538452148438, 0.15532684326171875, 0.16447830200195312, 0.1736297607421875, 0.18278121948242188, 0.19193267822265625, 0.20108413696289062, 0.210235595703125, 0.21938705444335938, 0.22853851318359375, 0.23768997192382812, 0.2468414306640625, 0.2559928894042969, 0.26514434814453125, 0.2742958068847656, 0.283447265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 55.0, 231.0, 422.0, 198.0, 47.0, 20.0, 2.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0669002532958984, -2.0030205249786377, -1.939140796661377, -1.8752609491348267, -1.811381220817566, -1.7475014925003052, -1.6836216449737549, -1.6197419166564941, -1.5558621883392334, -1.4919824600219727, -1.428102731704712, -1.3642228841781616, -1.3003431558609009, -1.2364634275436401, -1.1725835800170898, -1.108703851699829, -1.0448241233825684, -0.9809443950653076, -0.9170646071434021, -0.8531848192214966, -0.7893050909042358, -0.7254253625869751, -0.6615455746650696, -0.5976657867431641, -0.5337860584259033, -0.4699063003063202, -0.40602654218673706, -0.34214678406715393, -0.2782670259475708, -0.21438726782798767, -0.15050750970840454, -0.08662775158882141, -0.022748231887817383, 0.04113152623176575, 0.10501128435134888, 0.168891042470932, 0.23277080059051514, 0.29665055871009827, 0.3605303168296814, 0.4244100749492645, 0.48828983306884766, 0.5521695613861084, 0.6160493493080139, 0.6799291372299194, 0.7438088655471802, 0.8076885938644409, 0.8715683817863464, 0.935448169708252, 0.9993278980255127, 1.0632076263427734, 1.1270873546600342, 1.1909672021865845, 1.2548469305038452, 1.318726658821106, 1.3826065063476562, 1.446486234664917, 1.5103659629821777, 1.5742456912994385, 1.6381254196166992, 1.7020052671432495, 1.7658849954605103, 1.829764723777771, 1.8936445713043213, 1.957524299621582, 2.0214040279388428]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 14.0, 16.0, 23.0, 30.0, 43.0, 67.0, 70.0, 90.0, 96.0, 92.0, 96.0, 82.0, 68.0, 67.0, 45.0, 28.0, 29.0, 14.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6373637914657593, -0.6132196187973022, -0.5890754461288452, -0.5649312734603882, -0.5407871007919312, -0.5166428685188293, -0.4924986958503723, -0.4683545231819153, -0.44421035051345825, -0.4200661778450012, -0.3959220051765442, -0.37177780270576477, -0.34763363003730774, -0.3234894573688507, -0.2993452548980713, -0.27520108222961426, -0.2510569095611572, -0.2269127368927002, -0.20276854932308197, -0.17862436175346375, -0.1544801890850067, -0.13033601641654968, -0.10619182884693146, -0.08204764127731323, -0.0579034686088562, -0.03375928848981857, -0.009615108370780945, 0.014529071748256683, 0.03867325186729431, 0.06281743198633194, 0.08696161210536957, 0.11110579967498779, 0.13524991273880005, 0.15939408540725708, 0.1835382729768753, 0.20768246054649353, 0.23182663321495056, 0.2559708058834076, 0.280115008354187, 0.30425918102264404, 0.3284033536911011, 0.3525475263595581, 0.37669169902801514, 0.40083590149879456, 0.4249800741672516, 0.4491242468357086, 0.47326844930648804, 0.49741262197494507, 0.5215567946434021, 0.5457009673118591, 0.5698451399803162, 0.5939893126487732, 0.618133544921875, 0.642277717590332, 0.6664218902587891, 0.6905660629272461, 0.7147102355957031, 0.7388544082641602, 0.7629985809326172, 0.7871427536010742, 0.8112869262695312, 0.8354311585426331, 0.8595753312110901, 0.8837195038795471, 0.9078636765480042]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 20.0, 25.0, 39.0, 78.0, 126.0, 231.0, 480.0, 1251.0, 4620.0, 34030.0, 664377.0, 320260.0, 18063.0, 3109.0, 936.0, 413.0, 196.0, 112.0, 71.0, 28.0, 30.0, 12.0, 7.0, 12.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.7695541381835938, -0.7461395263671875, -0.7227249145507812, -0.699310302734375, -0.6758956909179688, -0.6524810791015625, -0.6290664672851562, -0.60565185546875, -0.5822372436523438, -0.5588226318359375, -0.5354080200195312, -0.511993408203125, -0.48857879638671875, -0.4651641845703125, -0.44174957275390625, -0.4183349609375, -0.39492034912109375, -0.3715057373046875, -0.34809112548828125, -0.324676513671875, -0.30126190185546875, -0.2778472900390625, -0.25443267822265625, -0.23101806640625, -0.20760345458984375, -0.1841888427734375, -0.16077423095703125, -0.137359619140625, -0.11394500732421875, -0.0905303955078125, -0.06711578369140625, -0.043701171875, -0.02028656005859375, 0.0031280517578125, 0.02654266357421875, 0.049957275390625, 0.07337188720703125, 0.0967864990234375, 0.12020111083984375, 0.14361572265625, 0.16703033447265625, 0.1904449462890625, 0.21385955810546875, 0.237274169921875, 0.26068878173828125, 0.2841033935546875, 0.30751800537109375, 0.3309326171875, 0.35434722900390625, 0.3777618408203125, 0.40117645263671875, 0.424591064453125, 0.44800567626953125, 0.4714202880859375, 0.49483489990234375, 0.51824951171875, 0.5416641235351562, 0.5650787353515625, 0.5884933471679688, 0.611907958984375, 0.6353225708007812, 0.6587371826171875, 0.6821517944335938, 0.70556640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 9.0, 17.0, 30.0, 39.0, 67.0, 73.0, 114.0, 87.0, 104.0, 112.0, 107.0, 83.0, 57.0, 49.0, 20.0, 15.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.18567848205566406, -0.17958450317382812, -0.1734905242919922, -0.16739654541015625, -0.1613025665283203, -0.15520858764648438, -0.14911460876464844, -0.1430206298828125, -0.13692665100097656, -0.13083267211914062, -0.12473869323730469, -0.11864471435546875, -0.11255073547363281, -0.10645675659179688, -0.10036277770996094, -0.094268798828125, -0.08817481994628906, -0.08208084106445312, -0.07598686218261719, -0.06989288330078125, -0.06379890441894531, -0.057704925537109375, -0.05161094665527344, -0.0455169677734375, -0.03942298889160156, -0.033329010009765625, -0.027235031127929688, -0.02114105224609375, -0.015047073364257812, -0.008953094482421875, -0.0028591156005859375, 0.00323486328125, 0.009328842163085938, 0.015422821044921875, 0.021516799926757812, 0.02761077880859375, 0.03370475769042969, 0.039798736572265625, 0.04589271545410156, 0.0519866943359375, 0.05808067321777344, 0.06417465209960938, 0.07026863098144531, 0.07636260986328125, 0.08245658874511719, 0.08855056762695312, 0.09464454650878906, 0.100738525390625, 0.10683250427246094, 0.11292648315429688, 0.11902046203613281, 0.12511444091796875, 0.1312084197998047, 0.13730239868164062, 0.14339637756347656, 0.1494903564453125, 0.15558433532714844, 0.16167831420898438, 0.1677722930908203, 0.17386627197265625, 0.1799602508544922, 0.18605422973632812, 0.19214820861816406, 0.1982421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 8.0, 8.0, 19.0, 13.0, 17.0, 38.0, 35.0, 58.0, 79.0, 135.0, 258.0, 536.0, 1709.0, 5982.0, 28431.0, 201684.0, 650360.0, 132125.0, 20249.0, 4433.0, 1307.0, 497.0, 215.0, 112.0, 58.0, 54.0, 30.0, 19.0, 19.0, 16.0, 15.0, 4.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322265625, -0.3116645812988281, -0.30106353759765625, -0.2904624938964844, -0.2798614501953125, -0.2692604064941406, -0.25865936279296875, -0.24805831909179688, -0.237457275390625, -0.22685623168945312, -0.21625518798828125, -0.20565414428710938, -0.1950531005859375, -0.18445205688476562, -0.17385101318359375, -0.16324996948242188, -0.15264892578125, -0.14204788208007812, -0.13144683837890625, -0.12084579467773438, -0.1102447509765625, -0.09964370727539062, -0.08904266357421875, -0.07844161987304688, -0.067840576171875, -0.057239532470703125, -0.04663848876953125, -0.036037445068359375, -0.0254364013671875, -0.014835357666015625, -0.00423431396484375, 0.006366729736328125, 0.0169677734375, 0.027568817138671875, 0.03816986083984375, 0.048770904541015625, 0.0593719482421875, 0.06997299194335938, 0.08057403564453125, 0.09117507934570312, 0.101776123046875, 0.11237716674804688, 0.12297821044921875, 0.13357925415039062, 0.1441802978515625, 0.15478134155273438, 0.16538238525390625, 0.17598342895507812, 0.18658447265625, 0.19718551635742188, 0.20778656005859375, 0.21838760375976562, 0.2289886474609375, 0.23958969116210938, 0.25019073486328125, 0.2607917785644531, 0.271392822265625, 0.2819938659667969, 0.29259490966796875, 0.3031959533691406, 0.3137969970703125, 0.3243980407714844, 0.33499908447265625, 0.3456001281738281, 0.356201171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 12.0, 8.0, 9.0, 11.0, 14.0, 13.0, 13.0, 14.0, 25.0, 32.0, 32.0, 29.0, 30.0, 43.0, 48.0, 41.0, 34.0, 57.0, 47.0, 49.0, 35.0, 48.0, 40.0, 45.0, 33.0, 34.0, 28.0, 24.0, 27.0, 19.0, 32.0, 20.0, 7.0, 11.0, 10.0, 3.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.273681640625, -0.2647056579589844, -0.25572967529296875, -0.24675369262695312, -0.2377777099609375, -0.22880172729492188, -0.21982574462890625, -0.21084976196289062, -0.201873779296875, -0.19289779663085938, -0.18392181396484375, -0.17494583129882812, -0.1659698486328125, -0.15699386596679688, -0.14801788330078125, -0.13904190063476562, -0.13006591796875, -0.12108993530273438, -0.11211395263671875, -0.10313796997070312, -0.0941619873046875, -0.08518600463867188, -0.07621002197265625, -0.06723403930664062, -0.058258056640625, -0.049282073974609375, -0.04030609130859375, -0.031330108642578125, -0.0223541259765625, -0.013378143310546875, -0.00440216064453125, 0.004573822021484375, 0.0135498046875, 0.022525787353515625, 0.03150177001953125, 0.040477752685546875, 0.0494537353515625, 0.058429718017578125, 0.06740570068359375, 0.07638168334960938, 0.085357666015625, 0.09433364868164062, 0.10330963134765625, 0.11228561401367188, 0.1212615966796875, 0.13023757934570312, 0.13921356201171875, 0.14818954467773438, 0.15716552734375, 0.16614151000976562, 0.17511749267578125, 0.18409347534179688, 0.1930694580078125, 0.20204544067382812, 0.21102142333984375, 0.21999740600585938, 0.228973388671875, 0.23794937133789062, 0.24692535400390625, 0.2559013366699219, 0.2648773193359375, 0.2738533020019531, 0.28282928466796875, 0.2918052673339844, 0.30078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 3.0, 6.0, 22.0, 19.0, 34.0, 60.0, 76.0, 123.0, 210.0, 373.0, 839.0, 2303.0, 9453.0, 78605.0, 648914.0, 275873.0, 24622.0, 4485.0, 1281.0, 498.0, 274.0, 158.0, 95.0, 61.0, 47.0, 30.0, 25.0, 18.0, 14.0, 7.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1539306640625, -0.14908218383789062, -0.14423370361328125, -0.13938522338867188, -0.1345367431640625, -0.12968826293945312, -0.12483978271484375, -0.11999130249023438, -0.115142822265625, -0.11029434204101562, -0.10544586181640625, -0.10059738159179688, -0.0957489013671875, -0.09090042114257812, -0.08605194091796875, -0.08120346069335938, -0.07635498046875, -0.07150650024414062, -0.06665802001953125, -0.061809539794921875, -0.0569610595703125, -0.052112579345703125, -0.04726409912109375, -0.042415618896484375, -0.037567138671875, -0.032718658447265625, -0.02787017822265625, -0.023021697998046875, -0.0181732177734375, -0.013324737548828125, -0.00847625732421875, -0.003627777099609375, 0.001220703125, 0.006069183349609375, 0.01091766357421875, 0.015766143798828125, 0.0206146240234375, 0.025463104248046875, 0.03031158447265625, 0.035160064697265625, 0.040008544921875, 0.044857025146484375, 0.04970550537109375, 0.054553985595703125, 0.0594024658203125, 0.06425094604492188, 0.06909942626953125, 0.07394790649414062, 0.07879638671875, 0.08364486694335938, 0.08849334716796875, 0.09334182739257812, 0.0981903076171875, 0.10303878784179688, 0.10788726806640625, 0.11273574829101562, 0.117584228515625, 0.12243270874023438, 0.12728118896484375, 0.13212966918945312, 0.1369781494140625, 0.14182662963867188, 0.14667510986328125, 0.15152359008789062, 0.1563720703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 13.0, 24.0, 41.0, 75.0, 121.0, 182.0, 183.0, 151.0, 93.0, 53.0, 28.0, 13.0, 17.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004470348358154297, -0.00043696723878383636, -0.00042689964175224304, -0.0004168320447206497, -0.0004067644476890564, -0.0003966968506574631, -0.00038662925362586975, -0.00037656165659427643, -0.0003664940595626831, -0.0003564264625310898, -0.00034635886549949646, -0.00033629126846790314, -0.0003262236714363098, -0.0003161560744047165, -0.00030608847737312317, -0.00029602088034152985, -0.0002859532833099365, -0.0002758856862783432, -0.0002658180892467499, -0.00025575049221515656, -0.00024568289518356323, -0.0002356152981519699, -0.0002255477011203766, -0.00021548010408878326, -0.00020541250705718994, -0.00019534491002559662, -0.0001852773129940033, -0.00017520971596240997, -0.00016514211893081665, -0.00015507452189922333, -0.00014500692486763, -0.00013493932783603668, -0.00012487173080444336, -0.00011480413377285004, -0.00010473653674125671, -9.466893970966339e-05, -8.460134267807007e-05, -7.453374564647675e-05, -6.446614861488342e-05, -5.43985515832901e-05, -4.433095455169678e-05, -3.4263357520103455e-05, -2.4195760488510132e-05, -1.4128163456916809e-05, -4.060566425323486e-06, 6.0070306062698364e-06, 1.607462763786316e-05, 2.6142224669456482e-05, 3.6209821701049805e-05, 4.627741873264313e-05, 5.634501576423645e-05, 6.641261279582977e-05, 7.64802098274231e-05, 8.654780685901642e-05, 9.661540389060974e-05, 0.00010668300092220306, 0.00011675059795379639, 0.0001268181949853897, 0.00013688579201698303, 0.00014695338904857635, 0.00015702098608016968, 0.000167088583111763, 0.00017715618014335632, 0.00018722377717494965, 0.00019729137420654297]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 11.0, 9.0, 20.0, 29.0, 59.0, 144.0, 286.0, 815.0, 4432.0, 71730.0, 870650.0, 93860.0, 4921.0, 972.0, 319.0, 142.0, 67.0, 31.0, 18.0, 17.0, 6.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19045448303222656, -0.18327713012695312, -0.1760997772216797, -0.16892242431640625, -0.1617450714111328, -0.15456771850585938, -0.14739036560058594, -0.1402130126953125, -0.13303565979003906, -0.12585830688476562, -0.11868095397949219, -0.11150360107421875, -0.10432624816894531, -0.09714889526367188, -0.08997154235839844, -0.082794189453125, -0.07561683654785156, -0.06843948364257812, -0.06126213073730469, -0.05408477783203125, -0.04690742492675781, -0.039730072021484375, -0.03255271911621094, -0.0253753662109375, -0.018198013305664062, -0.011020660400390625, -0.0038433074951171875, 0.00333404541015625, 0.010511398315429688, 0.017688751220703125, 0.024866104125976562, 0.03204345703125, 0.03922080993652344, 0.046398162841796875, 0.05357551574707031, 0.06075286865234375, 0.06793022155761719, 0.07510757446289062, 0.08228492736816406, 0.0894622802734375, 0.09663963317871094, 0.10381698608398438, 0.11099433898925781, 0.11817169189453125, 0.1253490447998047, 0.13252639770507812, 0.13970375061035156, 0.146881103515625, 0.15405845642089844, 0.16123580932617188, 0.1684131622314453, 0.17559051513671875, 0.1827678680419922, 0.18994522094726562, 0.19712257385253906, 0.2042999267578125, 0.21147727966308594, 0.21865463256835938, 0.2258319854736328, 0.23300933837890625, 0.2401866912841797, 0.24736404418945312, 0.25454139709472656, 0.26171875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 15.0, 24.0, 30.0, 84.0, 131.0, 195.0, 202.0, 146.0, 90.0, 50.0, 17.0, 10.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17106246948242188, -0.16365814208984375, -0.15625381469726562, -0.1488494873046875, -0.14144515991210938, -0.13404083251953125, -0.12663650512695312, -0.119232177734375, -0.11182785034179688, -0.10442352294921875, -0.09701919555664062, -0.0896148681640625, -0.08221054077148438, -0.07480621337890625, -0.06740188598632812, -0.05999755859375, -0.052593231201171875, -0.04518890380859375, -0.037784576416015625, -0.0303802490234375, -0.022975921630859375, -0.01557159423828125, -0.008167266845703125, -0.000762939453125, 0.006641387939453125, 0.01404571533203125, 0.021450042724609375, 0.0288543701171875, 0.036258697509765625, 0.04366302490234375, 0.051067352294921875, 0.0584716796875, 0.06587600708007812, 0.07328033447265625, 0.08068466186523438, 0.0880889892578125, 0.09549331665039062, 0.10289764404296875, 0.11030197143554688, 0.117706298828125, 0.12511062622070312, 0.13251495361328125, 0.13991928100585938, 0.1473236083984375, 0.15472793579101562, 0.16213226318359375, 0.16953659057617188, 0.17694091796875, 0.18434524536132812, 0.19174957275390625, 0.19915390014648438, 0.2065582275390625, 0.21396255493164062, 0.22136688232421875, 0.22877120971679688, 0.236175537109375, 0.24357986450195312, 0.25098419189453125, 0.2583885192871094, 0.2657928466796875, 0.2731971740722656, 0.28060150146484375, 0.2880058288574219, 0.29541015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 11.0, 31.0, 77.0, 251.0, 360.0, 204.0, 51.0, 17.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.137864589691162, -2.9975500106811523, -2.8572354316711426, -2.716920852661133, -2.576606273651123, -2.4362916946411133, -2.2959768772125244, -2.1556622982025146, -2.015347719192505, -1.8750331401824951, -1.7347185611724854, -1.594403862953186, -1.4540892839431763, -1.3137747049331665, -1.1734600067138672, -1.0331454277038574, -0.8928308486938477, -0.7525162696838379, -0.6122016310691833, -0.4718870222568512, -0.33157241344451904, -0.19125783443450928, -0.050943195819854736, 0.0893714427947998, 0.22968602180480957, 0.3700006306171417, 0.5103152394294739, 0.6506298780441284, 0.7909444570541382, 0.931259036064148, 1.0715737342834473, 1.211888313293457, 1.352203369140625, 1.4925179481506348, 1.6328325271606445, 1.7731472253799438, 1.9134618043899536, 2.053776264190674, 2.1940910816192627, 2.3344056606292725, 2.4747202396392822, 2.615034818649292, 2.7553493976593018, 2.8956639766693115, 3.0359787940979004, 3.17629337310791, 3.31660795211792, 3.4569225311279297, 3.5972371101379395, 3.737551689147949, 3.877866268157959, 4.018180847167969, 4.1584954261779785, 4.298810005187988, 4.439124584197998, 4.579439163208008, 4.719754219055176, 4.8600687980651855, 5.000383377075195, 5.140697956085205, 5.281012535095215, 5.421327114105225, 5.561641693115234, 5.701956748962402, 5.842270851135254]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 14.0, 13.0, 13.0, 18.0, 22.0, 26.0, 27.0, 30.0, 38.0, 39.0, 38.0, 40.0, 51.0, 55.0, 44.0, 70.0, 51.0, 40.0, 51.0, 51.0, 32.0, 43.0, 30.0, 31.0, 25.0, 24.0, 16.0, 16.0, 8.0, 11.0, 11.0, 7.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80057692527771, -1.7496801614761353, -1.6987833976745605, -1.6478866338729858, -1.5969898700714111, -1.5460931062698364, -1.4951963424682617, -1.444299578666687, -1.3934028148651123, -1.3425060510635376, -1.291609287261963, -1.2407125234603882, -1.1898157596588135, -1.1389189958572388, -1.088022232055664, -1.0371254682540894, -0.9862286448478699, -0.9353318810462952, -0.8844351172447205, -0.8335383534431458, -0.782641589641571, -0.7317447662353516, -0.6808480024337769, -0.6299512386322021, -0.5790544748306274, -0.5281577110290527, -0.477260947227478, -0.4263641834259033, -0.3754674196243286, -0.3245706260204315, -0.2736738622188568, -0.2227770984172821, -0.17188036441802979, -0.12098360061645508, -0.07008682936429977, -0.01919005811214447, 0.03170670568943024, 0.08260348439216614, 0.13350024819374084, 0.18439701199531555, 0.23529377579689026, 0.28619053959846497, 0.3370873034000397, 0.38798409700393677, 0.4388808608055115, 0.4897776246070862, 0.5406743884086609, 0.5915711522102356, 0.6424679160118103, 0.693364679813385, 0.7442614436149597, 0.7951582074165344, 0.8460549712181091, 0.8969517946243286, 0.9478485584259033, 0.998745322227478, 1.0496420860290527, 1.1005388498306274, 1.1514356136322021, 1.2023323774337769, 1.2532291412353516, 1.3041259050369263, 1.355022668838501, 1.4059194326400757, 1.4568161964416504]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 12.0, 26.0, 45.0, 71.0, 127.0, 245.0, 504.0, 1353.0, 4897.0, 35421.0, 4087816.0, 54870.0, 5985.0, 1537.0, 625.0, 301.0, 176.0, 98.0, 57.0, 31.0, 17.0, 10.0, 13.0, 7.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3095703125, -1.27056884765625, -1.2315673828125, -1.19256591796875, -1.153564453125, -1.11456298828125, -1.0755615234375, -1.03656005859375, -0.99755859375, -0.95855712890625, -0.9195556640625, -0.88055419921875, -0.841552734375, -0.80255126953125, -0.7635498046875, -0.72454833984375, -0.685546875, -0.64654541015625, -0.6075439453125, -0.56854248046875, -0.529541015625, -0.49053955078125, -0.4515380859375, -0.41253662109375, -0.37353515625, -0.33453369140625, -0.2955322265625, -0.25653076171875, -0.217529296875, -0.17852783203125, -0.1395263671875, -0.10052490234375, -0.0615234375, -0.02252197265625, 0.0164794921875, 0.05548095703125, 0.094482421875, 0.13348388671875, 0.1724853515625, 0.21148681640625, 0.25048828125, 0.28948974609375, 0.3284912109375, 0.36749267578125, 0.406494140625, 0.44549560546875, 0.4844970703125, 0.52349853515625, 0.5625, 0.60150146484375, 0.6405029296875, 0.67950439453125, 0.718505859375, 0.75750732421875, 0.7965087890625, 0.83551025390625, 0.87451171875, 0.91351318359375, 0.9525146484375, 0.99151611328125, 1.030517578125, 1.06951904296875, 1.1085205078125, 1.14752197265625, 1.1865234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 12.0, 13.0, 27.0, 34.0, 58.0, 70.0, 85.0, 84.0, 91.0, 110.0, 83.0, 90.0, 74.0, 52.0, 41.0, 28.0, 19.0, 13.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.1882762908935547, -0.18258285522460938, -0.17688941955566406, -0.17119598388671875, -0.16550254821777344, -0.15980911254882812, -0.1541156768798828, -0.1484222412109375, -0.1427288055419922, -0.13703536987304688, -0.13134193420410156, -0.12564849853515625, -0.11995506286621094, -0.11426162719726562, -0.10856819152832031, -0.102874755859375, -0.09718132019042969, -0.09148788452148438, -0.08579444885253906, -0.08010101318359375, -0.07440757751464844, -0.06871414184570312, -0.06302070617675781, -0.0573272705078125, -0.05163383483886719, -0.045940399169921875, -0.04024696350097656, -0.03455352783203125, -0.028860092163085938, -0.023166656494140625, -0.017473220825195312, -0.01177978515625, -0.0060863494873046875, -0.000392913818359375, 0.0053005218505859375, 0.01099395751953125, 0.016687393188476562, 0.022380828857421875, 0.028074264526367188, 0.0337677001953125, 0.03946113586425781, 0.045154571533203125, 0.05084800720214844, 0.05654144287109375, 0.06223487854003906, 0.06792831420898438, 0.07362174987792969, 0.079315185546875, 0.08500862121582031, 0.09070205688476562, 0.09639549255371094, 0.10208892822265625, 0.10778236389160156, 0.11347579956054688, 0.11916923522949219, 0.1248626708984375, 0.1305561065673828, 0.13624954223632812, 0.14194297790527344, 0.14763641357421875, 0.15332984924316406, 0.15902328491210938, 0.1647167205810547, 0.17041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 1.0, 5.0, 3.0, 5.0, 8.0, 9.0, 14.0, 22.0, 28.0, 44.0, 58.0, 77.0, 84.0, 134.0, 221.0, 301.0, 537.0, 882.0, 1666.0, 3922.0, 15350.0, 150819.0, 3929683.0, 74154.0, 9875.0, 2942.0, 1350.0, 747.0, 418.0, 302.0, 178.0, 126.0, 75.0, 61.0, 56.0, 39.0, 24.0, 17.0, 9.0, 5.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.517578125, -0.5005416870117188, -0.4835052490234375, -0.46646881103515625, -0.449432373046875, -0.43239593505859375, -0.4153594970703125, -0.39832305908203125, -0.38128662109375, -0.36425018310546875, -0.3472137451171875, -0.33017730712890625, -0.313140869140625, -0.29610443115234375, -0.2790679931640625, -0.26203155517578125, -0.2449951171875, -0.22795867919921875, -0.2109222412109375, -0.19388580322265625, -0.176849365234375, -0.15981292724609375, -0.1427764892578125, -0.12574005126953125, -0.10870361328125, -0.09166717529296875, -0.0746307373046875, -0.05759429931640625, -0.040557861328125, -0.02352142333984375, -0.0064849853515625, 0.01055145263671875, 0.027587890625, 0.04462432861328125, 0.0616607666015625, 0.07869720458984375, 0.095733642578125, 0.11277008056640625, 0.1298065185546875, 0.14684295654296875, 0.16387939453125, 0.18091583251953125, 0.1979522705078125, 0.21498870849609375, 0.232025146484375, 0.24906158447265625, 0.2660980224609375, 0.28313446044921875, 0.3001708984375, 0.31720733642578125, 0.3342437744140625, 0.35128021240234375, 0.368316650390625, 0.38535308837890625, 0.4023895263671875, 0.41942596435546875, 0.43646240234375, 0.45349884033203125, 0.4705352783203125, 0.48757171630859375, 0.504608154296875, 0.5216445922851562, 0.5386810302734375, 0.5557174682617188, 0.57275390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 5.0, 9.0, 12.0, 31.0, 74.0, 210.0, 2981.0, 562.0, 121.0, 36.0, 12.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.417236328125, -0.4072399139404297, -0.3972434997558594, -0.38724708557128906, -0.37725067138671875, -0.36725425720214844, -0.3572578430175781, -0.3472614288330078, -0.3372650146484375, -0.3272686004638672, -0.3172721862792969, -0.30727577209472656, -0.29727935791015625, -0.28728294372558594, -0.2772865295410156, -0.2672901153564453, -0.257293701171875, -0.2472972869873047, -0.23730087280273438, -0.22730445861816406, -0.21730804443359375, -0.20731163024902344, -0.19731521606445312, -0.1873188018798828, -0.1773223876953125, -0.1673259735107422, -0.15732955932617188, -0.14733314514160156, -0.13733673095703125, -0.12734031677246094, -0.11734390258789062, -0.10734748840332031, -0.09735107421875, -0.08735466003417969, -0.07735824584960938, -0.06736183166503906, -0.05736541748046875, -0.04736900329589844, -0.037372589111328125, -0.027376174926757812, -0.0173797607421875, -0.0073833465576171875, 0.002613067626953125, 0.012609481811523438, 0.02260589599609375, 0.03260231018066406, 0.042598724365234375, 0.05259513854980469, 0.062591552734375, 0.07258796691894531, 0.08258438110351562, 0.09258079528808594, 0.10257720947265625, 0.11257362365722656, 0.12257003784179688, 0.1325664520263672, 0.1425628662109375, 0.1525592803955078, 0.16255569458007812, 0.17255210876464844, 0.18254852294921875, 0.19254493713378906, 0.20254135131835938, 0.2125377655029297, 0.2225341796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 27.0, 131.0, 399.0, 332.0, 68.0, 11.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9986463785171509, -1.931889295578003, -1.8651320934295654, -1.7983750104904175, -1.7316179275512695, -1.6648608446121216, -1.5981037616729736, -1.5313465595245361, -1.4645894765853882, -1.3978323936462402, -1.3310751914978027, -1.2643181085586548, -1.1975610256195068, -1.1308039426803589, -1.064046859741211, -0.9972896575927734, -0.9305325746536255, -0.8637754917144775, -0.7970183491706848, -0.7302612066268921, -0.6635041236877441, -0.5967470407485962, -0.5299898982048035, -0.46323278546333313, -0.3964756727218628, -0.32971855998039246, -0.2629614472389221, -0.19620433449745178, -0.12944722175598145, -0.06269010901451111, 0.0040670037269592285, 0.07082411646842957, 0.13758111000061035, 0.2043382227420807, 0.271095335483551, 0.33785244822502136, 0.4046095609664917, 0.47136667370796204, 0.5381237864494324, 0.6048809289932251, 0.671638011932373, 0.738395094871521, 0.8051522374153137, 0.8719093799591064, 0.9386664628982544, 1.0054235458374023, 1.0721807479858398, 1.1389378309249878, 1.2056949138641357, 1.2724519968032837, 1.3392090797424316, 1.4059662818908691, 1.472723364830017, 1.539480447769165, 1.6062376499176025, 1.6729947328567505, 1.7397518157958984, 1.8065088987350464, 1.8732659816741943, 1.9400231838226318, 2.0067801475524902, 2.0735373497009277, 2.1402945518493652, 2.2070515155792236, 2.273808717727661]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 12.0, 19.0, 24.0, 35.0, 38.0, 48.0, 67.0, 80.0, 98.0, 78.0, 92.0, 67.0, 70.0, 63.0, 37.0, 41.0, 30.0, 26.0, 17.0, 15.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5990517735481262, -0.5756936073303223, -0.5523354411125183, -0.5289772748947144, -0.5056191086769104, -0.48226094245910645, -0.4589027762413025, -0.43554461002349854, -0.4121864438056946, -0.3888282775878906, -0.36547011137008667, -0.3421119451522827, -0.31875377893447876, -0.2953956127166748, -0.27203744649887085, -0.2486792653799057, -0.22532108426094055, -0.2019629180431366, -0.17860475182533264, -0.1552465856075287, -0.13188841938972473, -0.10853024572134018, -0.08517207205295563, -0.06181390583515167, -0.03845573961734772, -0.015097571536898613, 0.008260596543550491, 0.031618766486644745, 0.0549769327044487, 0.07833509892225266, 0.10169327259063721, 0.12505143880844116, 0.14840960502624512, 0.17176777124404907, 0.19512593746185303, 0.21848410367965698, 0.24184226989746094, 0.2652004361152649, 0.28855860233306885, 0.3119167685508728, 0.33527493476867676, 0.3586331009864807, 0.38199126720428467, 0.4053494334220886, 0.4287075996398926, 0.45206576585769653, 0.4754239320755005, 0.49878209829330444, 0.5221402645111084, 0.5454984307289124, 0.5688565969467163, 0.5922147631645203, 0.6155729293823242, 0.6389310956001282, 0.6622892618179321, 0.6856474280357361, 0.7090056538581848, 0.7323638200759888, 0.7557219862937927, 0.7790801525115967, 0.8024383187294006, 0.8257964849472046, 0.8491546511650085, 0.8725128173828125, 0.8958709836006165]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 13.0, 25.0, 15.0, 23.0, 39.0, 59.0, 74.0, 120.0, 154.0, 256.0, 412.0, 670.0, 1316.0, 2903.0, 8057.0, 26664.0, 113082.0, 480292.0, 319815.0, 66865.0, 17218.0, 5661.0, 2168.0, 1056.0, 547.0, 307.0, 192.0, 133.0, 110.0, 79.0, 57.0, 40.0, 22.0, 26.0, 17.0, 9.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.372802734375, -0.3617820739746094, -0.35076141357421875, -0.3397407531738281, -0.3287200927734375, -0.3176994323730469, -0.30667877197265625, -0.2956581115722656, -0.284637451171875, -0.2736167907714844, -0.26259613037109375, -0.2515754699707031, -0.2405548095703125, -0.22953414916992188, -0.21851348876953125, -0.20749282836914062, -0.19647216796875, -0.18545150756835938, -0.17443084716796875, -0.16341018676757812, -0.1523895263671875, -0.14136886596679688, -0.13034820556640625, -0.11932754516601562, -0.108306884765625, -0.09728622436523438, -0.08626556396484375, -0.07524490356445312, -0.0642242431640625, -0.053203582763671875, -0.04218292236328125, -0.031162261962890625, -0.0201416015625, -0.009120941162109375, 0.00189971923828125, 0.012920379638671875, 0.0239410400390625, 0.034961700439453125, 0.04598236083984375, 0.057003021240234375, 0.068023681640625, 0.07904434204101562, 0.09006500244140625, 0.10108566284179688, 0.1121063232421875, 0.12312698364257812, 0.13414764404296875, 0.14516830444335938, 0.15618896484375, 0.16720962524414062, 0.17823028564453125, 0.18925094604492188, 0.2002716064453125, 0.21129226684570312, 0.22231292724609375, 0.23333358764648438, 0.244354248046875, 0.2553749084472656, 0.26639556884765625, 0.2774162292480469, 0.2884368896484375, 0.2994575500488281, 0.31047821044921875, 0.3214988708496094, 0.33251953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 8.0, 17.0, 23.0, 31.0, 39.0, 62.0, 67.0, 86.0, 98.0, 99.0, 101.0, 77.0, 72.0, 75.0, 53.0, 24.0, 30.0, 15.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.2022876739501953, -0.19644546508789062, -0.19060325622558594, -0.18476104736328125, -0.17891883850097656, -0.17307662963867188, -0.1672344207763672, -0.1613922119140625, -0.1555500030517578, -0.14970779418945312, -0.14386558532714844, -0.13802337646484375, -0.13218116760253906, -0.12633895874023438, -0.12049674987792969, -0.114654541015625, -0.10881233215332031, -0.10297012329101562, -0.09712791442871094, -0.09128570556640625, -0.08544349670410156, -0.07960128784179688, -0.07375907897949219, -0.0679168701171875, -0.06207466125488281, -0.056232452392578125, -0.05039024353027344, -0.04454803466796875, -0.03870582580566406, -0.032863616943359375, -0.027021408081054688, -0.02117919921875, -0.015336990356445312, -0.009494781494140625, -0.0036525726318359375, 0.00218963623046875, 0.008031845092773438, 0.013874053955078125, 0.019716262817382812, 0.0255584716796875, 0.03140068054199219, 0.037242889404296875, 0.04308509826660156, 0.04892730712890625, 0.05476951599121094, 0.060611724853515625, 0.06645393371582031, 0.072296142578125, 0.07813835144042969, 0.08398056030273438, 0.08982276916503906, 0.09566497802734375, 0.10150718688964844, 0.10734939575195312, 0.11319160461425781, 0.1190338134765625, 0.12487602233886719, 0.13071823120117188, 0.13656044006347656, 0.14240264892578125, 0.14824485778808594, 0.15408706665039062, 0.1599292755126953, 0.165771484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 14.0, 12.0, 16.0, 22.0, 39.0, 27.0, 58.0, 82.0, 106.0, 193.0, 261.0, 449.0, 772.0, 1434.0, 3392.0, 9689.0, 36643.0, 172237.0, 541195.0, 218324.0, 44475.0, 11483.0, 3875.0, 1645.0, 808.0, 408.0, 242.0, 183.0, 145.0, 82.0, 53.0, 50.0, 36.0, 25.0, 25.0, 13.0, 9.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2442626953125, -0.23627281188964844, -0.22828292846679688, -0.2202930450439453, -0.21230316162109375, -0.2043132781982422, -0.19632339477539062, -0.18833351135253906, -0.1803436279296875, -0.17235374450683594, -0.16436386108398438, -0.1563739776611328, -0.14838409423828125, -0.1403942108154297, -0.13240432739257812, -0.12441444396972656, -0.116424560546875, -0.10843467712402344, -0.10044479370117188, -0.09245491027832031, -0.08446502685546875, -0.07647514343261719, -0.06848526000976562, -0.06049537658691406, -0.0525054931640625, -0.04451560974121094, -0.036525726318359375, -0.028535842895507812, -0.02054595947265625, -0.012556076049804688, -0.004566192626953125, 0.0034236907958984375, 0.01141357421875, 0.019403457641601562, 0.027393341064453125, 0.03538322448730469, 0.04337310791015625, 0.05136299133300781, 0.059352874755859375, 0.06734275817871094, 0.0753326416015625, 0.08332252502441406, 0.09131240844726562, 0.09930229187011719, 0.10729217529296875, 0.11528205871582031, 0.12327194213867188, 0.13126182556152344, 0.139251708984375, 0.14724159240722656, 0.15523147583007812, 0.1632213592529297, 0.17121124267578125, 0.1792011260986328, 0.18719100952148438, 0.19518089294433594, 0.2031707763671875, 0.21116065979003906, 0.21915054321289062, 0.2271404266357422, 0.23513031005859375, 0.2431201934814453, 0.2511100769042969, 0.25909996032714844, 0.26708984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 22.0, 22.0, 25.0, 26.0, 27.0, 34.0, 32.0, 29.0, 38.0, 36.0, 40.0, 39.0, 42.0, 59.0, 41.0, 44.0, 45.0, 42.0, 45.0, 37.0, 32.0, 35.0, 15.0, 21.0, 26.0, 15.0, 16.0, 13.0, 12.0, 12.0, 7.0, 4.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.433837890625, -0.42200469970703125, -0.4101715087890625, -0.39833831787109375, -0.386505126953125, -0.37467193603515625, -0.3628387451171875, -0.35100555419921875, -0.33917236328125, -0.32733917236328125, -0.3155059814453125, -0.30367279052734375, -0.291839599609375, -0.28000640869140625, -0.2681732177734375, -0.25634002685546875, -0.2445068359375, -0.23267364501953125, -0.2208404541015625, -0.20900726318359375, -0.197174072265625, -0.18534088134765625, -0.1735076904296875, -0.16167449951171875, -0.14984130859375, -0.13800811767578125, -0.1261749267578125, -0.11434173583984375, -0.102508544921875, -0.09067535400390625, -0.0788421630859375, -0.06700897216796875, -0.05517578125, -0.04334259033203125, -0.0315093994140625, -0.01967620849609375, -0.007843017578125, 0.00399017333984375, 0.0158233642578125, 0.02765655517578125, 0.03948974609375, 0.05132293701171875, 0.0631561279296875, 0.07498931884765625, 0.086822509765625, 0.09865570068359375, 0.1104888916015625, 0.12232208251953125, 0.1341552734375, 0.14598846435546875, 0.1578216552734375, 0.16965484619140625, 0.181488037109375, 0.19332122802734375, 0.2051544189453125, 0.21698760986328125, 0.22882080078125, 0.24065399169921875, 0.2524871826171875, 0.26432037353515625, 0.276153564453125, 0.28798675537109375, 0.2998199462890625, 0.31165313720703125, 0.323486328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 11.0, 36.0, 102.0, 415.0, 5786.0, 924535.0, 115932.0, 1462.0, 199.0, 40.0, 20.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.50738525390625, -0.4927978515625, -0.47821044921875, -0.463623046875, -0.44903564453125, -0.4344482421875, -0.41986083984375, -0.4052734375, -0.39068603515625, -0.3760986328125, -0.36151123046875, -0.346923828125, -0.33233642578125, -0.3177490234375, -0.30316162109375, -0.28857421875, -0.27398681640625, -0.2593994140625, -0.24481201171875, -0.230224609375, -0.21563720703125, -0.2010498046875, -0.18646240234375, -0.171875, -0.15728759765625, -0.1427001953125, -0.12811279296875, -0.113525390625, -0.09893798828125, -0.0843505859375, -0.06976318359375, -0.05517578125, -0.04058837890625, -0.0260009765625, -0.01141357421875, 0.003173828125, 0.01776123046875, 0.0323486328125, 0.04693603515625, 0.0615234375, 0.07611083984375, 0.0906982421875, 0.10528564453125, 0.119873046875, 0.13446044921875, 0.1490478515625, 0.16363525390625, 0.17822265625, 0.19281005859375, 0.2073974609375, 0.22198486328125, 0.236572265625, 0.25115966796875, 0.2657470703125, 0.28033447265625, 0.294921875, 0.30950927734375, 0.3240966796875, 0.33868408203125, 0.353271484375, 0.36785888671875, 0.3824462890625, 0.39703369140625, 0.41162109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 10.0, 27.0, 32.0, 53.0, 93.0, 109.0, 220.0, 176.0, 100.0, 65.0, 47.0, 34.0, 16.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002999305725097656, -0.00028908252716064453, -0.00027823448181152344, -0.00026738643646240234, -0.00025653839111328125, -0.00024569034576416016, -0.00023484230041503906, -0.00022399425506591797, -0.00021314620971679688, -0.00020229816436767578, -0.0001914501190185547, -0.0001806020736694336, -0.0001697540283203125, -0.0001589059829711914, -0.0001480579376220703, -0.00013720989227294922, -0.00012636184692382812, -0.00011551380157470703, -0.00010466575622558594, -9.381771087646484e-05, -8.296966552734375e-05, -7.212162017822266e-05, -6.127357482910156e-05, -5.042552947998047e-05, -3.9577484130859375e-05, -2.872943878173828e-05, -1.7881393432617188e-05, -7.033348083496094e-06, 3.814697265625e-06, 1.4662742614746094e-05, 2.5510787963867188e-05, 3.635883331298828e-05, 4.7206878662109375e-05, 5.805492401123047e-05, 6.890296936035156e-05, 7.975101470947266e-05, 9.059906005859375e-05, 0.00010144710540771484, 0.00011229515075683594, 0.00012314319610595703, 0.00013399124145507812, 0.00014483928680419922, 0.0001556873321533203, 0.0001665353775024414, 0.0001773834228515625, 0.0001882314682006836, 0.0001990795135498047, 0.00020992755889892578, 0.00022077560424804688, 0.00023162364959716797, 0.00024247169494628906, 0.00025331974029541016, 0.00026416778564453125, 0.00027501583099365234, 0.00028586387634277344, 0.00029671192169189453, 0.0003075599670410156, 0.0003184080123901367, 0.0003292560577392578, 0.0003401041030883789, 0.0003509521484375, 0.0003618001937866211, 0.0003726482391357422, 0.0003834962844848633, 0.0003943443298339844]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 20.0, 29.0, 56.0, 111.0, 200.0, 553.0, 2651.0, 41972.0, 873104.0, 123915.0, 4685.0, 766.0, 221.0, 105.0, 64.0, 38.0, 15.0, 15.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.29278564453125, -0.2838134765625, -0.27484130859375, -0.265869140625, -0.25689697265625, -0.2479248046875, -0.23895263671875, -0.22998046875, -0.22100830078125, -0.2120361328125, -0.20306396484375, -0.194091796875, -0.18511962890625, -0.1761474609375, -0.16717529296875, -0.158203125, -0.14923095703125, -0.1402587890625, -0.13128662109375, -0.122314453125, -0.11334228515625, -0.1043701171875, -0.09539794921875, -0.08642578125, -0.07745361328125, -0.0684814453125, -0.05950927734375, -0.050537109375, -0.04156494140625, -0.0325927734375, -0.02362060546875, -0.0146484375, -0.00567626953125, 0.0032958984375, 0.01226806640625, 0.021240234375, 0.03021240234375, 0.0391845703125, 0.04815673828125, 0.05712890625, 0.06610107421875, 0.0750732421875, 0.08404541015625, 0.093017578125, 0.10198974609375, 0.1109619140625, 0.11993408203125, 0.12890625, 0.13787841796875, 0.1468505859375, 0.15582275390625, 0.164794921875, 0.17376708984375, 0.1827392578125, 0.19171142578125, 0.20068359375, 0.20965576171875, 0.2186279296875, 0.22760009765625, 0.236572265625, 0.24554443359375, 0.2545166015625, 0.26348876953125, 0.2724609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 17.0, 50.0, 106.0, 186.0, 244.0, 204.0, 119.0, 50.0, 12.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.56689453125, -0.5556869506835938, -0.5444793701171875, -0.5332717895507812, -0.522064208984375, -0.5108566284179688, -0.4996490478515625, -0.48844146728515625, -0.47723388671875, -0.46602630615234375, -0.4548187255859375, -0.44361114501953125, -0.432403564453125, -0.42119598388671875, -0.4099884033203125, -0.39878082275390625, -0.3875732421875, -0.37636566162109375, -0.3651580810546875, -0.35395050048828125, -0.342742919921875, -0.33153533935546875, -0.3203277587890625, -0.30912017822265625, -0.29791259765625, -0.28670501708984375, -0.2754974365234375, -0.26428985595703125, -0.253082275390625, -0.24187469482421875, -0.2306671142578125, -0.21945953369140625, -0.208251953125, -0.19704437255859375, -0.1858367919921875, -0.17462921142578125, -0.163421630859375, -0.15221405029296875, -0.1410064697265625, -0.12979888916015625, -0.11859130859375, -0.10738372802734375, -0.0961761474609375, -0.08496856689453125, -0.073760986328125, -0.06255340576171875, -0.0513458251953125, -0.04013824462890625, -0.0289306640625, -0.01772308349609375, -0.0065155029296875, 0.00469207763671875, 0.015899658203125, 0.02710723876953125, 0.0383148193359375, 0.04952239990234375, 0.06072998046875, 0.07193756103515625, 0.0831451416015625, 0.09435272216796875, 0.105560302734375, 0.11676788330078125, 0.1279754638671875, 0.13918304443359375, 0.150390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 8.0, 21.0, 31.0, 103.0, 245.0, 277.0, 187.0, 79.0, 30.0, 9.0, 4.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.837831020355225, -5.712147235870361, -5.586463451385498, -5.460780143737793, -5.33509635925293, -5.209412574768066, -5.083728790283203, -4.95804500579834, -4.832361221313477, -4.706677436828613, -4.58099365234375, -4.455310344696045, -4.329626560211182, -4.203942775726318, -4.078258991241455, -3.952575206756592, -3.8268918991088867, -3.7012081146240234, -3.5755245685577393, -3.449840784072876, -3.324157238006592, -3.1984734535217285, -3.0727896690368652, -2.947105884552002, -2.8214223384857178, -2.6957385540008545, -2.5700550079345703, -2.444371223449707, -2.3186874389648438, -2.1930038928985596, -2.0673201084136963, -1.9416364431381226, -1.815953254699707, -1.6902695894241333, -1.5645859241485596, -1.4389021396636963, -1.3132184743881226, -1.1875348091125488, -1.0618510246276855, -0.9361673593521118, -0.8104836940765381, -0.6848000288009644, -0.5591163039207458, -0.43343260884284973, -0.3077489137649536, -0.18206524848937988, -0.05638152360916138, 0.06930220127105713, 0.19498586654663086, 0.320669561624527, 0.4463532567024231, 0.5720369815826416, 0.6977206468582153, 0.8234043121337891, 0.9490880370140076, 1.074771761894226, 1.2004554271697998, 1.3261390924453735, 1.4518227577209473, 1.5775065422058105, 1.7031902074813843, 1.828873872756958, 1.9545576572418213, 2.0802412033081055, 2.2059249877929688]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 11.0, 6.0, 7.0, 11.0, 15.0, 13.0, 13.0, 18.0, 20.0, 21.0, 25.0, 28.0, 35.0, 32.0, 41.0, 41.0, 40.0, 27.0, 31.0, 42.0, 45.0, 40.0, 43.0, 43.0, 41.0, 30.0, 26.0, 31.0, 38.0, 28.0, 17.0, 21.0, 20.0, 13.0, 22.0, 12.0, 9.0, 12.0, 8.0, 11.0, 9.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.745201587677002, -1.6897183656692505, -1.6342350244522095, -1.578751802444458, -1.523268461227417, -1.4677852392196655, -1.412302017211914, -1.356818675994873, -1.3013354539871216, -1.2458522319793701, -1.190368890762329, -1.1348856687545776, -1.0794024467468262, -1.0239191055297852, -0.9684358835220337, -0.9129526019096375, -0.8574693202972412, -0.801986038684845, -0.7465027570724487, -0.6910195350646973, -0.635536253452301, -0.5800529718399048, -0.5245697498321533, -0.4690864682197571, -0.41360318660736084, -0.3581199049949646, -0.30263665318489075, -0.2471533864736557, -0.19167011976242065, -0.13618683815002441, -0.08070358633995056, -0.02522033452987671, 0.03026282787322998, 0.08574609458446503, 0.14122936129570007, 0.19671262800693512, 0.25219589471817017, 0.3076791763305664, 0.36316242814064026, 0.4186456799507141, 0.47412896156311035, 0.5296122431755066, 0.5850955247879028, 0.6405787467956543, 0.6960620284080505, 0.7515453100204468, 0.8070285320281982, 0.8625118136405945, 0.9179950952529907, 0.973478376865387, 1.0289616584777832, 1.0844448804855347, 1.1399281024932861, 1.1954114437103271, 1.2508946657180786, 1.30637788772583, 1.361861228942871, 1.4173444509506226, 1.4728277921676636, 1.528311014175415, 1.583794355392456, 1.6392775774002075, 1.694760799407959, 1.750244140625, 1.8057273626327515]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 7.0, 5.0, 9.0, 4.0, 13.0, 20.0, 14.0, 33.0, 58.0, 58.0, 141.0, 270.0, 485.0, 965.0, 2115.0, 5613.0, 18651.0, 155817.0, 3941878.0, 50926.0, 10419.0, 3612.0, 1532.0, 708.0, 356.0, 193.0, 99.0, 87.0, 58.0, 33.0, 30.0, 19.0, 15.0, 9.0, 13.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.74267578125, -0.7216339111328125, -0.700592041015625, -0.6795501708984375, -0.65850830078125, -0.6374664306640625, -0.616424560546875, -0.5953826904296875, -0.5743408203125, -0.5532989501953125, -0.532257080078125, -0.5112152099609375, -0.49017333984375, -0.4691314697265625, -0.448089599609375, -0.4270477294921875, -0.406005859375, -0.3849639892578125, -0.363922119140625, -0.3428802490234375, -0.32183837890625, -0.3007965087890625, -0.279754638671875, -0.2587127685546875, -0.2376708984375, -0.2166290283203125, -0.195587158203125, -0.1745452880859375, -0.15350341796875, -0.1324615478515625, -0.111419677734375, -0.0903778076171875, -0.0693359375, -0.0482940673828125, -0.027252197265625, -0.0062103271484375, 0.01483154296875, 0.0358734130859375, 0.056915283203125, 0.0779571533203125, 0.0989990234375, 0.1200408935546875, 0.141082763671875, 0.1621246337890625, 0.18316650390625, 0.2042083740234375, 0.225250244140625, 0.2462921142578125, 0.267333984375, 0.2883758544921875, 0.309417724609375, 0.3304595947265625, 0.35150146484375, 0.3725433349609375, 0.393585205078125, 0.4146270751953125, 0.4356689453125, 0.4567108154296875, 0.477752685546875, 0.4987945556640625, 0.51983642578125, 0.5408782958984375, 0.561920166015625, 0.5829620361328125, 0.60400390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 18.0, 23.0, 42.0, 44.0, 60.0, 70.0, 71.0, 83.0, 88.0, 75.0, 75.0, 70.0, 74.0, 61.0, 34.0, 27.0, 26.0, 18.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2109375, -0.205047607421875, -0.19915771484375, -0.193267822265625, -0.1873779296875, -0.181488037109375, -0.17559814453125, -0.169708251953125, -0.163818359375, -0.157928466796875, -0.15203857421875, -0.146148681640625, -0.1402587890625, -0.134368896484375, -0.12847900390625, -0.122589111328125, -0.11669921875, -0.110809326171875, -0.10491943359375, -0.099029541015625, -0.0931396484375, -0.087249755859375, -0.08135986328125, -0.075469970703125, -0.069580078125, -0.063690185546875, -0.05780029296875, -0.051910400390625, -0.0460205078125, -0.040130615234375, -0.03424072265625, -0.028350830078125, -0.0224609375, -0.016571044921875, -0.01068115234375, -0.004791259765625, 0.0010986328125, 0.006988525390625, 0.01287841796875, 0.018768310546875, 0.024658203125, 0.030548095703125, 0.03643798828125, 0.042327880859375, 0.0482177734375, 0.054107666015625, 0.05999755859375, 0.065887451171875, 0.07177734375, 0.077667236328125, 0.08355712890625, 0.089447021484375, 0.0953369140625, 0.101226806640625, 0.10711669921875, 0.113006591796875, 0.118896484375, 0.124786376953125, 0.13067626953125, 0.136566162109375, 0.1424560546875, 0.148345947265625, 0.15423583984375, 0.160125732421875, 0.166015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 4.0, 10.0, 21.0, 22.0, 55.0, 60.0, 96.0, 157.0, 270.0, 430.0, 831.0, 1732.0, 4578.0, 20253.0, 389999.0, 3727023.0, 37437.0, 6777.0, 2179.0, 995.0, 523.0, 296.0, 171.0, 130.0, 81.0, 48.0, 36.0, 20.0, 19.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5810546875, -0.5624008178710938, -0.5437469482421875, -0.5250930786132812, -0.506439208984375, -0.48778533935546875, -0.4691314697265625, -0.45047760009765625, -0.43182373046875, -0.41316986083984375, -0.3945159912109375, -0.37586212158203125, -0.357208251953125, -0.33855438232421875, -0.3199005126953125, -0.30124664306640625, -0.2825927734375, -0.26393890380859375, -0.2452850341796875, -0.22663116455078125, -0.207977294921875, -0.18932342529296875, -0.1706695556640625, -0.15201568603515625, -0.13336181640625, -0.11470794677734375, -0.0960540771484375, -0.07740020751953125, -0.058746337890625, -0.04009246826171875, -0.0214385986328125, -0.00278472900390625, 0.015869140625, 0.03452301025390625, 0.0531768798828125, 0.07183074951171875, 0.090484619140625, 0.10913848876953125, 0.1277923583984375, 0.14644622802734375, 0.16510009765625, 0.18375396728515625, 0.2024078369140625, 0.22106170654296875, 0.239715576171875, 0.25836944580078125, 0.2770233154296875, 0.29567718505859375, 0.3143310546875, 0.33298492431640625, 0.3516387939453125, 0.37029266357421875, 0.388946533203125, 0.40760040283203125, 0.4262542724609375, 0.44490814208984375, 0.46356201171875, 0.48221588134765625, 0.5008697509765625, 0.5195236206054688, 0.538177490234375, 0.5568313598632812, 0.5754852294921875, 0.5941390991210938, 0.61279296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 11.0, 8.0, 14.0, 16.0, 45.0, 86.0, 506.0, 3039.0, 225.0, 66.0, 24.0, 12.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5318679809570312, -0.5183258056640625, -0.5047836303710938, -0.491241455078125, -0.47769927978515625, -0.4641571044921875, -0.45061492919921875, -0.43707275390625, -0.42353057861328125, -0.4099884033203125, -0.39644622802734375, -0.382904052734375, -0.36936187744140625, -0.3558197021484375, -0.34227752685546875, -0.3287353515625, -0.31519317626953125, -0.3016510009765625, -0.28810882568359375, -0.274566650390625, -0.26102447509765625, -0.2474822998046875, -0.23394012451171875, -0.22039794921875, -0.20685577392578125, -0.1933135986328125, -0.17977142333984375, -0.166229248046875, -0.15268707275390625, -0.1391448974609375, -0.12560272216796875, -0.112060546875, -0.09851837158203125, -0.0849761962890625, -0.07143402099609375, -0.057891845703125, -0.04434967041015625, -0.0308074951171875, -0.01726531982421875, -0.00372314453125, 0.00981903076171875, 0.0233612060546875, 0.03690338134765625, 0.050445556640625, 0.06398773193359375, 0.0775299072265625, 0.09107208251953125, 0.1046142578125, 0.11815643310546875, 0.1316986083984375, 0.14524078369140625, 0.158782958984375, 0.17232513427734375, 0.1858673095703125, 0.19940948486328125, 0.21295166015625, 0.22649383544921875, 0.2400360107421875, 0.25357818603515625, 0.267120361328125, 0.28066253662109375, 0.2942047119140625, 0.30774688720703125, 0.3212890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 14.0, 36.0, 170.0, 467.0, 232.0, 49.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.968031883239746, -3.87689208984375, -3.785752296447754, -3.694612503051758, -3.6034727096557617, -3.5123326778411865, -3.4211928844451904, -3.3300530910491943, -3.2389132976531982, -3.147773504257202, -3.056633710861206, -2.96549391746521, -2.8743538856506348, -2.7832140922546387, -2.6920742988586426, -2.6009345054626465, -2.5097947120666504, -2.4186549186706543, -2.327515125274658, -2.236375331878662, -2.145235538482666, -2.054095506668091, -1.9629557132720947, -1.8718159198760986, -1.7806761264801025, -1.6895363330841064, -1.5983965396881104, -1.5072566270828247, -1.4161168336868286, -1.3249770402908325, -1.2338371276855469, -1.1426973342895508, -1.0515577793121338, -0.9604179859161377, -0.8692781329154968, -0.778138279914856, -0.6869984865188599, -0.5958586931228638, -0.5047188401222229, -0.41357898712158203, -0.32243919372558594, -0.23129937052726746, -0.14015954732894897, -0.04901972413063049, 0.04212009906768799, 0.13325992226600647, 0.22439974546432495, 0.3155395984649658, 0.4066793918609619, 0.4978192150592804, 0.5889590382575989, 0.6800988912582397, 0.7712386846542358, 0.8623784780502319, 0.9535183310508728, 1.0446581840515137, 1.1357979774475098, 1.2269377708435059, 1.318077564239502, 1.4092174768447876, 1.5003572702407837, 1.5914970636367798, 1.6826369762420654, 1.7737767696380615, 1.8649165630340576]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 9.0, 10.0, 15.0, 17.0, 16.0, 31.0, 31.0, 36.0, 42.0, 50.0, 54.0, 49.0, 68.0, 59.0, 54.0, 59.0, 40.0, 46.0, 57.0, 39.0, 33.0, 30.0, 27.0, 31.0, 25.0, 18.0, 13.0, 5.0, 9.0, 7.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6551198363304138, -0.6312218904495239, -0.6073240041732788, -0.5834261178970337, -0.5595281720161438, -0.5356302261352539, -0.5117323398590088, -0.4878344237804413, -0.4639365077018738, -0.4400385916233063, -0.41614067554473877, -0.39224275946617126, -0.36834484338760376, -0.34444692730903625, -0.32054901123046875, -0.29665109515190125, -0.27275317907333374, -0.24885526299476624, -0.22495734691619873, -0.20105943083763123, -0.17716151475906372, -0.15326359868049622, -0.1293656826019287, -0.1054677665233612, -0.0815698504447937, -0.057671934366226196, -0.03377401828765869, -0.009876102209091187, 0.014021813869476318, 0.03791972994804382, 0.06181764602661133, 0.08571556210517883, 0.10961341857910156, 0.13351133465766907, 0.15740925073623657, 0.18130716681480408, 0.20520508289337158, 0.2291029989719391, 0.2530009150505066, 0.2768988311290741, 0.3007967472076416, 0.3246946632862091, 0.3485925793647766, 0.3724904954433441, 0.3963884115219116, 0.4202863276004791, 0.44418424367904663, 0.46808215975761414, 0.49198007583618164, 0.5158779621124268, 0.5397759079933167, 0.5636738538742065, 0.5875717401504517, 0.6114696264266968, 0.6353675723075867, 0.6592655181884766, 0.6831634044647217, 0.7070612907409668, 0.7309592366218567, 0.7548571825027466, 0.7787550687789917, 0.8026529550552368, 0.8265509009361267, 0.8504488468170166, 0.8743467330932617]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 13.0, 21.0, 25.0, 44.0, 90.0, 195.0, 371.0, 995.0, 3540.0, 28818.0, 684001.0, 312748.0, 14004.0, 2321.0, 719.0, 309.0, 157.0, 90.0, 31.0, 20.0, 13.0, 12.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8335189819335938, -0.8081512451171875, -0.7827835083007812, -0.757415771484375, -0.7320480346679688, -0.7066802978515625, -0.6813125610351562, -0.65594482421875, -0.6305770874023438, -0.6052093505859375, -0.5798416137695312, -0.554473876953125, -0.5291061401367188, -0.5037384033203125, -0.47837066650390625, -0.4530029296875, -0.42763519287109375, -0.4022674560546875, -0.37689971923828125, -0.351531982421875, -0.32616424560546875, -0.3007965087890625, -0.27542877197265625, -0.25006103515625, -0.22469329833984375, -0.1993255615234375, -0.17395782470703125, -0.148590087890625, -0.12322235107421875, -0.0978546142578125, -0.07248687744140625, -0.047119140625, -0.02175140380859375, 0.0036163330078125, 0.02898406982421875, 0.054351806640625, 0.07971954345703125, 0.1050872802734375, 0.13045501708984375, 0.15582275390625, 0.18119049072265625, 0.2065582275390625, 0.23192596435546875, 0.257293701171875, 0.28266143798828125, 0.3080291748046875, 0.33339691162109375, 0.3587646484375, 0.38413238525390625, 0.4095001220703125, 0.43486785888671875, 0.460235595703125, 0.48560333251953125, 0.5109710693359375, 0.5363388061523438, 0.56170654296875, 0.5870742797851562, 0.6124420166015625, 0.6378097534179688, 0.663177490234375, 0.6885452270507812, 0.7139129638671875, 0.7392807006835938, 0.7646484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 34.0, 44.0, 57.0, 74.0, 64.0, 72.0, 73.0, 91.0, 87.0, 88.0, 53.0, 66.0, 56.0, 29.0, 24.0, 12.0, 17.0, 10.0, 0.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221435546875, -0.21514892578125, -0.2088623046875, -0.20257568359375, -0.1962890625, -0.19000244140625, -0.1837158203125, -0.17742919921875, -0.171142578125, -0.16485595703125, -0.1585693359375, -0.15228271484375, -0.14599609375, -0.13970947265625, -0.1334228515625, -0.12713623046875, -0.120849609375, -0.11456298828125, -0.1082763671875, -0.10198974609375, -0.095703125, -0.08941650390625, -0.0831298828125, -0.07684326171875, -0.070556640625, -0.06427001953125, -0.0579833984375, -0.05169677734375, -0.04541015625, -0.03912353515625, -0.0328369140625, -0.02655029296875, -0.020263671875, -0.01397705078125, -0.0076904296875, -0.00140380859375, 0.0048828125, 0.01116943359375, 0.0174560546875, 0.02374267578125, 0.030029296875, 0.03631591796875, 0.0426025390625, 0.04888916015625, 0.05517578125, 0.06146240234375, 0.0677490234375, 0.07403564453125, 0.080322265625, 0.08660888671875, 0.0928955078125, 0.09918212890625, 0.10546875, 0.11175537109375, 0.1180419921875, 0.12432861328125, 0.130615234375, 0.13690185546875, 0.1431884765625, 0.14947509765625, 0.15576171875, 0.16204833984375, 0.1683349609375, 0.17462158203125, 0.180908203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 3.0, 3.0, 26.0, 18.0, 25.0, 48.0, 84.0, 137.0, 214.0, 388.0, 825.0, 2079.0, 7520.0, 49578.0, 583976.0, 364060.0, 30900.0, 5451.0, 1672.0, 716.0, 356.0, 181.0, 95.0, 64.0, 41.0, 34.0, 20.0, 15.0, 11.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.450927734375, -0.43721771240234375, -0.4235076904296875, -0.40979766845703125, -0.396087646484375, -0.38237762451171875, -0.3686676025390625, -0.35495758056640625, -0.34124755859375, -0.32753753662109375, -0.3138275146484375, -0.30011749267578125, -0.286407470703125, -0.27269744873046875, -0.2589874267578125, -0.24527740478515625, -0.2315673828125, -0.21785736083984375, -0.2041473388671875, -0.19043731689453125, -0.176727294921875, -0.16301727294921875, -0.1493072509765625, -0.13559722900390625, -0.12188720703125, -0.10817718505859375, -0.0944671630859375, -0.08075714111328125, -0.067047119140625, -0.05333709716796875, -0.0396270751953125, -0.02591705322265625, -0.01220703125, 0.00150299072265625, 0.0152130126953125, 0.02892303466796875, 0.042633056640625, 0.05634307861328125, 0.0700531005859375, 0.08376312255859375, 0.09747314453125, 0.11118316650390625, 0.1248931884765625, 0.13860321044921875, 0.152313232421875, 0.16602325439453125, 0.1797332763671875, 0.19344329833984375, 0.2071533203125, 0.22086334228515625, 0.2345733642578125, 0.24828338623046875, 0.261993408203125, 0.27570343017578125, 0.2894134521484375, 0.30312347412109375, 0.31683349609375, 0.33054351806640625, 0.3442535400390625, 0.35796356201171875, 0.371673583984375, 0.38538360595703125, 0.3990936279296875, 0.41280364990234375, 0.426513671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 4.0, 11.0, 12.0, 11.0, 12.0, 18.0, 33.0, 29.0, 36.0, 39.0, 58.0, 48.0, 47.0, 47.0, 64.0, 51.0, 56.0, 62.0, 49.0, 53.0, 44.0, 40.0, 26.0, 36.0, 25.0, 24.0, 23.0, 12.0, 4.0, 8.0, 8.0, 3.0, 8.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4603157043457031, -0.44235992431640625, -0.4244041442871094, -0.4064483642578125, -0.3884925842285156, -0.37053680419921875, -0.3525810241699219, -0.334625244140625, -0.3166694641113281, -0.29871368408203125, -0.2807579040527344, -0.2628021240234375, -0.24484634399414062, -0.22689056396484375, -0.20893478393554688, -0.19097900390625, -0.17302322387695312, -0.15506744384765625, -0.13711166381835938, -0.1191558837890625, -0.10120010375976562, -0.08324432373046875, -0.06528854370117188, -0.047332763671875, -0.029376983642578125, -0.01142120361328125, 0.006534576416015625, 0.0244903564453125, 0.042446136474609375, 0.06040191650390625, 0.07835769653320312, 0.0963134765625, 0.11426925659179688, 0.13222503662109375, 0.15018081665039062, 0.1681365966796875, 0.18609237670898438, 0.20404815673828125, 0.22200393676757812, 0.239959716796875, 0.2579154968261719, 0.27587127685546875, 0.2938270568847656, 0.3117828369140625, 0.3297386169433594, 0.34769439697265625, 0.3656501770019531, 0.38360595703125, 0.4015617370605469, 0.41951751708984375, 0.4374732971191406, 0.4554290771484375, 0.4733848571777344, 0.49134063720703125, 0.5092964172363281, 0.527252197265625, 0.5452079772949219, 0.5631637573242188, 0.5811195373535156, 0.5990753173828125, 0.6170310974121094, 0.6349868774414062, 0.6529426574707031, 0.6708984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 20.0, 49.0, 90.0, 225.0, 667.0, 3176.0, 38517.0, 849630.0, 147948.0, 6530.0, 1113.0, 343.0, 118.0, 54.0, 26.0, 12.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.31324195861816406, -0.3044624328613281, -0.2956829071044922, -0.28690338134765625, -0.2781238555908203, -0.2693443298339844, -0.26056480407714844, -0.2517852783203125, -0.24300575256347656, -0.23422622680664062, -0.2254467010498047, -0.21666717529296875, -0.2078876495361328, -0.19910812377929688, -0.19032859802246094, -0.181549072265625, -0.17276954650878906, -0.16399002075195312, -0.1552104949951172, -0.14643096923828125, -0.1376514434814453, -0.12887191772460938, -0.12009239196777344, -0.1113128662109375, -0.10253334045410156, -0.09375381469726562, -0.08497428894042969, -0.07619476318359375, -0.06741523742675781, -0.058635711669921875, -0.04985618591308594, -0.04107666015625, -0.03229713439941406, -0.023517608642578125, -0.014738082885742188, -0.00595855712890625, 0.0028209686279296875, 0.011600494384765625, 0.020380020141601562, 0.0291595458984375, 0.03793907165527344, 0.046718597412109375, 0.05549812316894531, 0.06427764892578125, 0.07305717468261719, 0.08183670043945312, 0.09061622619628906, 0.099395751953125, 0.10817527770996094, 0.11695480346679688, 0.1257343292236328, 0.13451385498046875, 0.1432933807373047, 0.15207290649414062, 0.16085243225097656, 0.1696319580078125, 0.17841148376464844, 0.18719100952148438, 0.1959705352783203, 0.20475006103515625, 0.2135295867919922, 0.22230911254882812, 0.23108863830566406, 0.2398681640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 12.0, 10.0, 15.0, 17.0, 21.0, 27.0, 33.0, 54.0, 63.0, 70.0, 101.0, 104.0, 93.0, 75.0, 58.0, 50.0, 36.0, 22.0, 27.0, 25.0, 15.0, 7.0, 16.0, 5.0, 7.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014388561248779297, -0.0001390315592288971, -0.00013417750597000122, -0.00012932345271110535, -0.00012446939945220947, -0.0001196153461933136, -0.00011476129293441772, -0.00010990723967552185, -0.00010505318641662598, -0.0001001991331577301, -9.534507989883423e-05, -9.049102663993835e-05, -8.563697338104248e-05, -8.07829201221466e-05, -7.592886686325073e-05, -7.107481360435486e-05, -6.622076034545898e-05, -6.136670708656311e-05, -5.6512653827667236e-05, -5.165860056877136e-05, -4.680454730987549e-05, -4.1950494050979614e-05, -3.709644079208374e-05, -3.2242387533187866e-05, -2.7388334274291992e-05, -2.2534281015396118e-05, -1.7680227756500244e-05, -1.282617449760437e-05, -7.972121238708496e-06, -3.118067979812622e-06, 1.735985279083252e-06, 6.590038537979126e-06, 1.1444091796875e-05, 1.6298145055770874e-05, 2.1152198314666748e-05, 2.6006251573562622e-05, 3.0860304832458496e-05, 3.571435809135437e-05, 4.0568411350250244e-05, 4.542246460914612e-05, 5.027651786804199e-05, 5.5130571126937866e-05, 5.998462438583374e-05, 6.483867764472961e-05, 6.969273090362549e-05, 7.454678416252136e-05, 7.940083742141724e-05, 8.425489068031311e-05, 8.910894393920898e-05, 9.396299719810486e-05, 9.881705045700073e-05, 0.0001036711037158966, 0.00010852515697479248, 0.00011337921023368835, 0.00011823326349258423, 0.0001230873167514801, 0.00012794137001037598, 0.00013279542326927185, 0.00013764947652816772, 0.0001425035297870636, 0.00014735758304595947, 0.00015221163630485535, 0.00015706568956375122, 0.0001619197428226471, 0.00016677379608154297]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 16.0, 17.0, 49.0, 88.0, 229.0, 715.0, 3580.0, 77920.0, 920452.0, 41801.0, 2787.0, 512.0, 223.0, 76.0, 41.0, 19.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.2819557189941406, -0.27167510986328125, -0.2613945007324219, -0.2511138916015625, -0.24083328247070312, -0.23055267333984375, -0.22027206420898438, -0.209991455078125, -0.19971084594726562, -0.18943023681640625, -0.17914962768554688, -0.1688690185546875, -0.15858840942382812, -0.14830780029296875, -0.13802719116210938, -0.12774658203125, -0.11746597290039062, -0.10718536376953125, -0.09690475463867188, -0.0866241455078125, -0.07634353637695312, -0.06606292724609375, -0.055782318115234375, -0.045501708984375, -0.035221099853515625, -0.02494049072265625, -0.014659881591796875, -0.0043792724609375, 0.005901336669921875, 0.01618194580078125, 0.026462554931640625, 0.0367431640625, 0.047023773193359375, 0.05730438232421875, 0.06758499145507812, 0.0778656005859375, 0.08814620971679688, 0.09842681884765625, 0.10870742797851562, 0.118988037109375, 0.12926864624023438, 0.13954925537109375, 0.14982986450195312, 0.1601104736328125, 0.17039108276367188, 0.18067169189453125, 0.19095230102539062, 0.20123291015625, 0.21151351928710938, 0.22179412841796875, 0.23207473754882812, 0.2423553466796875, 0.2526359558105469, 0.26291656494140625, 0.2731971740722656, 0.283477783203125, 0.2937583923339844, 0.30403900146484375, 0.3143196105957031, 0.3246002197265625, 0.3348808288574219, 0.34516143798828125, 0.3554420471191406, 0.36572265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 4.0, 11.0, 8.0, 18.0, 47.0, 62.0, 130.0, 153.0, 187.0, 138.0, 93.0, 73.0, 36.0, 13.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14160728454589844, -0.13294601440429688, -0.12428474426269531, -0.11562347412109375, -0.10696220397949219, -0.09830093383789062, -0.08963966369628906, -0.0809783935546875, -0.07231712341308594, -0.06365585327148438, -0.05499458312988281, -0.04633331298828125, -0.03767204284667969, -0.029010772705078125, -0.020349502563476562, -0.011688232421875, -0.0030269622802734375, 0.005634307861328125, 0.014295578002929688, 0.02295684814453125, 0.03161811828613281, 0.040279388427734375, 0.04894065856933594, 0.0576019287109375, 0.06626319885253906, 0.07492446899414062, 0.08358573913574219, 0.09224700927734375, 0.10090827941894531, 0.10956954956054688, 0.11823081970214844, 0.12689208984375, 0.13555335998535156, 0.14421463012695312, 0.1528759002685547, 0.16153717041015625, 0.1701984405517578, 0.17885971069335938, 0.18752098083496094, 0.1961822509765625, 0.20484352111816406, 0.21350479125976562, 0.2221660614013672, 0.23082733154296875, 0.2394886016845703, 0.24814987182617188, 0.25681114196777344, 0.265472412109375, 0.27413368225097656, 0.2827949523925781, 0.2914562225341797, 0.30011749267578125, 0.3087787628173828, 0.3174400329589844, 0.32610130310058594, 0.3347625732421875, 0.34342384338378906, 0.3520851135253906, 0.3607463836669922, 0.36940765380859375, 0.3780689239501953, 0.3867301940917969, 0.39539146423339844, 0.404052734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 28.0, 54.0, 112.0, 204.0, 240.0, 179.0, 94.0, 38.0, 13.0, 14.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6615819931030273, -3.5490167140960693, -3.4364516735076904, -3.3238863945007324, -3.2113211154937744, -3.0987558364868164, -2.9861907958984375, -2.8736255168914795, -2.7610602378845215, -2.6484949588775635, -2.5359299182891846, -2.4233646392822266, -2.3107993602752686, -2.1982340812683105, -2.0856690406799316, -1.9731037616729736, -1.8605386018753052, -1.7479734420776367, -1.6354081630706787, -1.5228430032730103, -1.4102777242660522, -1.2977125644683838, -1.1851472854614258, -1.0725821256637573, -0.9600169062614441, -0.8474516868591309, -0.7348864674568176, -0.6223212480545044, -0.5097560882568359, -0.3971908688545227, -0.2846256494522095, -0.17206043004989624, -0.05949521064758301, 0.05307000130414963, 0.16563521325588226, 0.2782004177570343, 0.39076563715934753, 0.5033308267593384, 0.6158960461616516, 0.7284612655639648, 0.8410264849662781, 0.9535917043685913, 1.0661568641662598, 1.1787221431732178, 1.2912873029708862, 1.4038524627685547, 1.5164177417755127, 1.6289830207824707, 1.7415481805801392, 1.8541133403778076, 1.9666786193847656, 2.0792438983917236, 2.1918089389801025, 2.3043742179870605, 2.4169394969940186, 2.5295047760009766, 2.6420698165893555, 2.7546350955963135, 2.8672001361846924, 2.9797654151916504, 3.0923306941986084, 3.2048959732055664, 3.3174610137939453, 3.4300262928009033, 3.5425915718078613]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 7.0, 8.0, 13.0, 13.0, 17.0, 11.0, 19.0, 16.0, 24.0, 27.0, 23.0, 40.0, 38.0, 37.0, 38.0, 44.0, 43.0, 51.0, 42.0, 34.0, 37.0, 49.0, 45.0, 48.0, 36.0, 36.0, 16.0, 26.0, 26.0, 18.0, 20.0, 22.0, 12.0, 13.0, 7.0, 7.0, 7.0, 7.0, 0.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.4537458419799805, -2.3853323459625244, -2.3169188499450684, -2.2485053539276123, -2.1800918579101562, -2.111678123474121, -2.043264627456665, -1.974851131439209, -1.906437635421753, -1.8380241394042969, -1.7696106433868408, -1.7011970281600952, -1.6327835321426392, -1.564370036125183, -1.4959564208984375, -1.4275429248809814, -1.3591294288635254, -1.2907159328460693, -1.2223024368286133, -1.1538888216018677, -1.0854753255844116, -1.0170618295669556, -0.9486482739448547, -0.8802347183227539, -0.8118212223052979, -0.7434077262878418, -0.674994170665741, -0.6065806150436401, -0.5381671190261841, -0.46975359320640564, -0.4013400673866272, -0.33292654156684875, -0.2645127773284912, -0.19609925150871277, -0.12768572568893433, -0.059272199869155884, 0.009141325950622559, 0.077554851770401, 0.14596837759017944, 0.21438190340995789, 0.28279542922973633, 0.35120895504951477, 0.4196224808692932, 0.48803600668907166, 0.5564495325088501, 0.6248630285263062, 0.693276584148407, 0.7616901397705078, 0.8301036357879639, 0.8985171318054199, 0.9669306874275208, 1.0353442430496216, 1.1037577390670776, 1.1721712350845337, 1.2405848503112793, 1.3089983463287354, 1.3774118423461914, 1.4458253383636475, 1.5142388343811035, 1.5826524496078491, 1.6510659456253052, 1.7194794416427612, 1.7878930568695068, 1.856306552886963, 1.924720048904419]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 9.0, 4.0, 13.0, 14.0, 25.0, 45.0, 43.0, 100.0, 134.0, 201.0, 413.0, 1472.0, 39169.0, 4148656.0, 2715.0, 552.0, 290.0, 156.0, 88.0, 58.0, 43.0, 25.0, 16.0, 8.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6708984375, -1.6204986572265625, -1.570098876953125, -1.5196990966796875, -1.46929931640625, -1.4188995361328125, -1.368499755859375, -1.3180999755859375, -1.2677001953125, -1.2173004150390625, -1.166900634765625, -1.1165008544921875, -1.06610107421875, -1.0157012939453125, -0.965301513671875, -0.9149017333984375, -0.864501953125, -0.8141021728515625, -0.763702392578125, -0.7133026123046875, -0.66290283203125, -0.6125030517578125, -0.562103271484375, -0.5117034912109375, -0.4613037109375, -0.4109039306640625, -0.360504150390625, -0.3101043701171875, -0.25970458984375, -0.2093048095703125, -0.158905029296875, -0.1085052490234375, -0.05810546875, -0.0077056884765625, 0.042694091796875, 0.0930938720703125, 0.14349365234375, 0.1938934326171875, 0.244293212890625, 0.2946929931640625, 0.3450927734375, 0.3954925537109375, 0.445892333984375, 0.4962921142578125, 0.54669189453125, 0.5970916748046875, 0.647491455078125, 0.6978912353515625, 0.748291015625, 0.7986907958984375, 0.849090576171875, 0.8994903564453125, 0.94989013671875, 1.0002899169921875, 1.050689697265625, 1.1010894775390625, 1.1514892578125, 1.2018890380859375, 1.252288818359375, 1.3026885986328125, 1.35308837890625, 1.4034881591796875, 1.453887939453125, 1.5042877197265625, 1.5546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 2.0, 5.0, 5.0, 14.0, 16.0, 31.0, 28.0, 34.0, 37.0, 53.0, 68.0, 57.0, 63.0, 79.0, 76.0, 66.0, 72.0, 68.0, 56.0, 44.0, 31.0, 23.0, 15.0, 20.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.221923828125, -0.2158985137939453, -0.20987319946289062, -0.20384788513183594, -0.19782257080078125, -0.19179725646972656, -0.18577194213867188, -0.1797466278076172, -0.1737213134765625, -0.1676959991455078, -0.16167068481445312, -0.15564537048339844, -0.14962005615234375, -0.14359474182128906, -0.13756942749023438, -0.1315441131591797, -0.125518798828125, -0.11949348449707031, -0.11346817016601562, -0.10744285583496094, -0.10141754150390625, -0.09539222717285156, -0.08936691284179688, -0.08334159851074219, -0.0773162841796875, -0.07129096984863281, -0.06526565551757812, -0.05924034118652344, -0.05321502685546875, -0.04718971252441406, -0.041164398193359375, -0.03513908386230469, -0.02911376953125, -0.023088455200195312, -0.017063140869140625, -0.011037826538085938, -0.00501251220703125, 0.0010128021240234375, 0.007038116455078125, 0.013063430786132812, 0.0190887451171875, 0.025114059448242188, 0.031139373779296875, 0.03716468811035156, 0.04319000244140625, 0.04921531677246094, 0.055240631103515625, 0.06126594543457031, 0.067291259765625, 0.07331657409667969, 0.07934188842773438, 0.08536720275878906, 0.09139251708984375, 0.09741783142089844, 0.10344314575195312, 0.10946846008300781, 0.1154937744140625, 0.12151908874511719, 0.12754440307617188, 0.13356971740722656, 0.13959503173828125, 0.14562034606933594, 0.15164566040039062, 0.1576709747314453, 0.1636962890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 9.0, 5.0, 18.0, 22.0, 28.0, 39.0, 48.0, 80.0, 79.0, 115.0, 168.0, 248.0, 322.0, 526.0, 852.0, 1684.0, 3561.0, 9771.0, 52785.0, 4059514.0, 47402.0, 9372.0, 3562.0, 1592.0, 877.0, 495.0, 341.0, 231.0, 149.0, 124.0, 85.0, 44.0, 45.0, 19.0, 20.0, 12.0, 8.0, 10.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3459434509277344, -0.33495330810546875, -0.3239631652832031, -0.3129730224609375, -0.3019828796386719, -0.29099273681640625, -0.2800025939941406, -0.269012451171875, -0.2580223083496094, -0.24703216552734375, -0.23604202270507812, -0.2250518798828125, -0.21406173706054688, -0.20307159423828125, -0.19208145141601562, -0.18109130859375, -0.17010116577148438, -0.15911102294921875, -0.14812088012695312, -0.1371307373046875, -0.12614059448242188, -0.11515045166015625, -0.10416030883789062, -0.093170166015625, -0.08218002319335938, -0.07118988037109375, -0.060199737548828125, -0.0492095947265625, -0.038219451904296875, -0.02722930908203125, -0.016239166259765625, -0.0052490234375, 0.005741119384765625, 0.01673126220703125, 0.027721405029296875, 0.0387115478515625, 0.049701690673828125, 0.06069183349609375, 0.07168197631835938, 0.082672119140625, 0.09366226196289062, 0.10465240478515625, 0.11564254760742188, 0.1266326904296875, 0.13762283325195312, 0.14861297607421875, 0.15960311889648438, 0.17059326171875, 0.18158340454101562, 0.19257354736328125, 0.20356369018554688, 0.2145538330078125, 0.22554397583007812, 0.23653411865234375, 0.24752426147460938, 0.258514404296875, 0.2695045471191406, 0.28049468994140625, 0.2914848327636719, 0.3024749755859375, 0.3134651184082031, 0.32445526123046875, 0.3354454040527344, 0.346435546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 14.0, 23.0, 120.0, 3665.0, 164.0, 33.0, 18.0, 11.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15996646881103516, -0.1561145782470703, -0.15226268768310547, -0.14841079711914062, -0.14455890655517578, -0.14070701599121094, -0.1368551254272461, -0.13300323486328125, -0.1291513442993164, -0.12529945373535156, -0.12144756317138672, -0.11759567260742188, -0.11374378204345703, -0.10989189147949219, -0.10604000091552734, -0.1021881103515625, -0.09833621978759766, -0.09448432922363281, -0.09063243865966797, -0.08678054809570312, -0.08292865753173828, -0.07907676696777344, -0.0752248764038086, -0.07137298583984375, -0.0675210952758789, -0.06366920471191406, -0.05981731414794922, -0.055965423583984375, -0.05211353302001953, -0.04826164245605469, -0.044409751892089844, -0.040557861328125, -0.036705970764160156, -0.03285408020019531, -0.02900218963623047, -0.025150299072265625, -0.02129840850830078, -0.017446517944335938, -0.013594627380371094, -0.00974273681640625, -0.005890846252441406, -0.0020389556884765625, 0.0018129348754882812, 0.005664825439453125, 0.009516716003417969, 0.013368606567382812, 0.017220497131347656, 0.0210723876953125, 0.024924278259277344, 0.028776168823242188, 0.03262805938720703, 0.036479949951171875, 0.04033184051513672, 0.04418373107910156, 0.048035621643066406, 0.05188751220703125, 0.055739402770996094, 0.05959129333496094, 0.06344318389892578, 0.06729507446289062, 0.07114696502685547, 0.07499885559082031, 0.07885074615478516, 0.08270263671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 13.0, 21.0, 61.0, 105.0, 168.0, 239.0, 186.0, 102.0, 61.0, 21.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35893046855926514, -0.3456893265247345, -0.33244821429252625, -0.3192070722579956, -0.30596593022346497, -0.2927247881889343, -0.2794836759567261, -0.26624253392219543, -0.2530013918876648, -0.23976026475429535, -0.2265191227197647, -0.21327799558639526, -0.20003685355186462, -0.18679572641849518, -0.17355459928512573, -0.1603134572505951, -0.14707234501838684, -0.1338312178850174, -0.12059007585048676, -0.10734894871711731, -0.09410781413316727, -0.08086667954921722, -0.06762555241584778, -0.054384417831897736, -0.04114328324794769, -0.0279021505266428, -0.014661017805337906, -0.0014198869466781616, 0.011821247637271881, 0.025062382221221924, 0.03830350935459137, 0.05154464393854141, 0.06478574872016907, 0.07802688330411911, 0.09126801788806915, 0.1045091450214386, 0.11775027960538864, 0.13099141418933868, 0.14423254132270813, 0.15747368335723877, 0.17071481049060822, 0.18395593762397766, 0.1971970796585083, 0.21043820679187775, 0.2236793339252472, 0.23692047595977783, 0.2501615881919861, 0.2634027302265167, 0.27664387226104736, 0.289885014295578, 0.30312612652778625, 0.3163672685623169, 0.32960841059684753, 0.3428495526313782, 0.3560906648635864, 0.36933180689811707, 0.3825729489326477, 0.39581409096717834, 0.4090552031993866, 0.42229634523391724, 0.4355374872684479, 0.4487786293029785, 0.46201974153518677, 0.4752608835697174, 0.48850199580192566]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 8.0, 10.0, 8.0, 8.0, 25.0, 20.0, 16.0, 14.0, 28.0, 28.0, 33.0, 41.0, 29.0, 28.0, 34.0, 36.0, 43.0, 47.0, 35.0, 48.0, 49.0, 30.0, 32.0, 35.0, 33.0, 31.0, 35.0, 31.0, 32.0, 23.0, 21.0, 17.0, 15.0, 8.0, 7.0, 9.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15804731845855713, -0.15313029289245605, -0.1482132524251938, -0.1432962268590927, -0.13837918639183044, -0.13346216082572937, -0.1285451203584671, -0.12362809479236603, -0.11871106177568436, -0.11379402875900269, -0.10887699574232101, -0.10395996272563934, -0.09904293715953827, -0.094125896692276, -0.08920887112617493, -0.08429183810949326, -0.07937480509281158, -0.07445777207612991, -0.06954073905944824, -0.06462370604276657, -0.0597066767513752, -0.05478964373469353, -0.049872614443302155, -0.04495558142662048, -0.04003854840993881, -0.03512151539325714, -0.03020448423922062, -0.025287453085184097, -0.020370420068502426, -0.015453387051820755, -0.010536355897784233, -0.005619324743747711, -0.00070229172706604, 0.0042147403582930565, 0.009131772443652153, 0.01404880452901125, 0.018965836614370346, 0.023882869631052017, 0.02879990078508854, 0.03371693193912506, 0.03863396495580673, 0.0435509979724884, 0.048468030989170074, 0.05338506028056145, 0.05830209329724312, 0.06321913003921509, 0.06813615560531616, 0.07305318862199783, 0.0779702216386795, 0.08288725465536118, 0.08780428767204285, 0.09272132068872452, 0.09763835370540619, 0.10255537927150726, 0.10747241228818893, 0.1123894453048706, 0.11730647832155228, 0.12222351133823395, 0.12714053690433502, 0.1320575773715973, 0.13697460293769836, 0.14189164340496063, 0.1468086689710617, 0.15172570943832397, 0.15664273500442505]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 8.0, 9.0, 14.0, 20.0, 32.0, 42.0, 63.0, 97.0, 123.0, 184.0, 265.0, 400.0, 608.0, 1187.0, 2294.0, 5076.0, 12257.0, 35721.0, 121031.0, 371742.0, 340346.0, 104746.0, 31591.0, 11169.0, 4576.0, 2085.0, 1105.0, 594.0, 370.0, 224.0, 172.0, 115.0, 89.0, 53.0, 38.0, 32.0, 13.0, 18.0, 15.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29784393310546875, -0.2888031005859375, -0.27976226806640625, -0.270721435546875, -0.26168060302734375, -0.2526397705078125, -0.24359893798828125, -0.23455810546875, -0.22551727294921875, -0.2164764404296875, -0.20743560791015625, -0.198394775390625, -0.18935394287109375, -0.1803131103515625, -0.17127227783203125, -0.1622314453125, -0.15319061279296875, -0.1441497802734375, -0.13510894775390625, -0.126068115234375, -0.11702728271484375, -0.1079864501953125, -0.09894561767578125, -0.08990478515625, -0.08086395263671875, -0.0718231201171875, -0.06278228759765625, -0.053741455078125, -0.04470062255859375, -0.0356597900390625, -0.02661895751953125, -0.017578125, -0.00853729248046875, 0.0005035400390625, 0.00954437255859375, 0.018585205078125, 0.02762603759765625, 0.0366668701171875, 0.04570770263671875, 0.05474853515625, 0.06378936767578125, 0.0728302001953125, 0.08187103271484375, 0.090911865234375, 0.09995269775390625, 0.1089935302734375, 0.11803436279296875, 0.1270751953125, 0.13611602783203125, 0.1451568603515625, 0.15419769287109375, 0.163238525390625, 0.17227935791015625, 0.1813201904296875, 0.19036102294921875, 0.19940185546875, 0.20844268798828125, 0.2174835205078125, 0.22652435302734375, 0.235565185546875, 0.24460601806640625, 0.2536468505859375, 0.26268768310546875, 0.271728515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 13.0, 6.0, 28.0, 21.0, 24.0, 26.0, 35.0, 43.0, 50.0, 68.0, 69.0, 65.0, 60.0, 65.0, 73.0, 66.0, 67.0, 46.0, 41.0, 33.0, 24.0, 23.0, 13.0, 8.0, 13.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2242431640625, -0.2181072235107422, -0.21197128295898438, -0.20583534240722656, -0.19969940185546875, -0.19356346130371094, -0.18742752075195312, -0.1812915802001953, -0.1751556396484375, -0.1690196990966797, -0.16288375854492188, -0.15674781799316406, -0.15061187744140625, -0.14447593688964844, -0.13833999633789062, -0.1322040557861328, -0.126068115234375, -0.11993217468261719, -0.11379623413085938, -0.10766029357910156, -0.10152435302734375, -0.09538841247558594, -0.08925247192382812, -0.08311653137207031, -0.0769805908203125, -0.07084465026855469, -0.06470870971679688, -0.05857276916503906, -0.05243682861328125, -0.04630088806152344, -0.040164947509765625, -0.03402900695800781, -0.02789306640625, -0.021757125854492188, -0.015621185302734375, -0.009485244750976562, -0.00334930419921875, 0.0027866363525390625, 0.008922576904296875, 0.015058517456054688, 0.0211944580078125, 0.027330398559570312, 0.033466339111328125, 0.03960227966308594, 0.04573822021484375, 0.05187416076660156, 0.058010101318359375, 0.06414604187011719, 0.070281982421875, 0.07641792297363281, 0.08255386352539062, 0.08868980407714844, 0.09482574462890625, 0.10096168518066406, 0.10709762573242188, 0.11323356628417969, 0.1193695068359375, 0.1255054473876953, 0.13164138793945312, 0.13777732849121094, 0.14391326904296875, 0.15004920959472656, 0.15618515014648438, 0.1623210906982422, 0.16845703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 6.0, 4.0, 9.0, 14.0, 21.0, 29.0, 33.0, 61.0, 74.0, 121.0, 224.0, 326.0, 565.0, 1117.0, 2897.0, 10526.0, 59533.0, 459226.0, 440968.0, 57024.0, 10346.0, 2898.0, 1118.0, 558.0, 330.0, 190.0, 131.0, 65.0, 54.0, 36.0, 23.0, 14.0, 6.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.3516883850097656, -0.34033966064453125, -0.3289909362792969, -0.3176422119140625, -0.3062934875488281, -0.29494476318359375, -0.2835960388183594, -0.272247314453125, -0.2608985900878906, -0.24954986572265625, -0.23820114135742188, -0.2268524169921875, -0.21550369262695312, -0.20415496826171875, -0.19280624389648438, -0.18145751953125, -0.17010879516601562, -0.15876007080078125, -0.14741134643554688, -0.1360626220703125, -0.12471389770507812, -0.11336517333984375, -0.10201644897460938, -0.090667724609375, -0.07931900024414062, -0.06797027587890625, -0.056621551513671875, -0.0452728271484375, -0.033924102783203125, -0.02257537841796875, -0.011226654052734375, 0.0001220703125, 0.011470794677734375, 0.02281951904296875, 0.034168243408203125, 0.0455169677734375, 0.056865692138671875, 0.06821441650390625, 0.07956314086914062, 0.090911865234375, 0.10226058959960938, 0.11360931396484375, 0.12495803833007812, 0.1363067626953125, 0.14765548706054688, 0.15900421142578125, 0.17035293579101562, 0.18170166015625, 0.19305038452148438, 0.20439910888671875, 0.21574783325195312, 0.2270965576171875, 0.23844528198242188, 0.24979400634765625, 0.2611427307128906, 0.272491455078125, 0.2838401794433594, 0.29518890380859375, 0.3065376281738281, 0.3178863525390625, 0.3292350769042969, 0.34058380126953125, 0.3519325256347656, 0.36328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 11.0, 5.0, 10.0, 9.0, 8.0, 14.0, 17.0, 23.0, 27.0, 27.0, 32.0, 50.0, 40.0, 48.0, 61.0, 39.0, 41.0, 65.0, 50.0, 41.0, 50.0, 43.0, 39.0, 44.0, 37.0, 30.0, 33.0, 27.0, 21.0, 17.0, 7.0, 13.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69970703125, -0.67938232421875, -0.6590576171875, -0.63873291015625, -0.618408203125, -0.59808349609375, -0.5777587890625, -0.55743408203125, -0.537109375, -0.51678466796875, -0.4964599609375, -0.47613525390625, -0.455810546875, -0.43548583984375, -0.4151611328125, -0.39483642578125, -0.37451171875, -0.35418701171875, -0.3338623046875, -0.31353759765625, -0.293212890625, -0.27288818359375, -0.2525634765625, -0.23223876953125, -0.2119140625, -0.19158935546875, -0.1712646484375, -0.15093994140625, -0.130615234375, -0.11029052734375, -0.0899658203125, -0.06964111328125, -0.04931640625, -0.02899169921875, -0.0086669921875, 0.01165771484375, 0.031982421875, 0.05230712890625, 0.0726318359375, 0.09295654296875, 0.11328125, 0.13360595703125, 0.1539306640625, 0.17425537109375, 0.194580078125, 0.21490478515625, 0.2352294921875, 0.25555419921875, 0.27587890625, 0.29620361328125, 0.3165283203125, 0.33685302734375, 0.357177734375, 0.37750244140625, 0.3978271484375, 0.41815185546875, 0.4384765625, 0.45880126953125, 0.4791259765625, 0.49945068359375, 0.519775390625, 0.54010009765625, 0.5604248046875, 0.58074951171875, 0.60107421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 16.0, 31.0, 54.0, 120.0, 209.0, 651.0, 1980.0, 8954.0, 115927.0, 850253.0, 61387.0, 6341.0, 1576.0, 576.0, 236.0, 110.0, 51.0, 24.0, 13.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.2357196807861328, -0.22742080688476562, -0.21912193298339844, -0.21082305908203125, -0.20252418518066406, -0.19422531127929688, -0.1859264373779297, -0.1776275634765625, -0.1693286895751953, -0.16102981567382812, -0.15273094177246094, -0.14443206787109375, -0.13613319396972656, -0.12783432006835938, -0.11953544616699219, -0.111236572265625, -0.10293769836425781, -0.09463882446289062, -0.08633995056152344, -0.07804107666015625, -0.06974220275878906, -0.061443328857421875, -0.05314445495605469, -0.0448455810546875, -0.03654670715332031, -0.028247833251953125, -0.019948959350585938, -0.01165008544921875, -0.0033512115478515625, 0.004947662353515625, 0.013246536254882812, 0.02154541015625, 0.029844284057617188, 0.038143157958984375, 0.04644203186035156, 0.05474090576171875, 0.06303977966308594, 0.07133865356445312, 0.07963752746582031, 0.0879364013671875, 0.09623527526855469, 0.10453414916992188, 0.11283302307128906, 0.12113189697265625, 0.12943077087402344, 0.13772964477539062, 0.1460285186767578, 0.154327392578125, 0.1626262664794922, 0.17092514038085938, 0.17922401428222656, 0.18752288818359375, 0.19582176208496094, 0.20412063598632812, 0.2124195098876953, 0.2207183837890625, 0.2290172576904297, 0.23731613159179688, 0.24561500549316406, 0.25391387939453125, 0.26221275329589844, 0.2705116271972656, 0.2788105010986328, 0.287109375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 3.0, 4.0, 5.0, 7.0, 17.0, 11.0, 11.0, 16.0, 23.0, 32.0, 38.0, 47.0, 66.0, 73.0, 85.0, 108.0, 88.0, 61.0, 65.0, 53.0, 48.0, 35.0, 13.0, 12.0, 14.0, 18.0, 6.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.554624557495117e-05, -9.220093488693237e-05, -8.885562419891357e-05, -8.551031351089478e-05, -8.216500282287598e-05, -7.881969213485718e-05, -7.547438144683838e-05, -7.212907075881958e-05, -6.878376007080078e-05, -6.543844938278198e-05, -6.209313869476318e-05, -5.8747828006744385e-05, -5.5402517318725586e-05, -5.205720663070679e-05, -4.871189594268799e-05, -4.536658525466919e-05, -4.202127456665039e-05, -3.867596387863159e-05, -3.533065319061279e-05, -3.1985342502593994e-05, -2.8640031814575195e-05, -2.5294721126556396e-05, -2.1949410438537598e-05, -1.86040997505188e-05, -1.52587890625e-05, -1.1913478374481201e-05, -8.568167686462402e-06, -5.2228569984436035e-06, -1.8775463104248047e-06, 1.4677643775939941e-06, 4.813075065612793e-06, 8.158385753631592e-06, 1.150369644165039e-05, 1.484900712966919e-05, 1.8194317817687988e-05, 2.1539628505706787e-05, 2.4884939193725586e-05, 2.8230249881744385e-05, 3.1575560569763184e-05, 3.492087125778198e-05, 3.826618194580078e-05, 4.161149263381958e-05, 4.495680332183838e-05, 4.830211400985718e-05, 5.1647424697875977e-05, 5.4992735385894775e-05, 5.8338046073913574e-05, 6.168335676193237e-05, 6.502866744995117e-05, 6.837397813796997e-05, 7.171928882598877e-05, 7.506459951400757e-05, 7.840991020202637e-05, 8.175522089004517e-05, 8.510053157806396e-05, 8.844584226608276e-05, 9.179115295410156e-05, 9.513646364212036e-05, 9.848177433013916e-05, 0.00010182708501815796, 0.00010517239570617676, 0.00010851770639419556, 0.00011186301708221436, 0.00011520832777023315, 0.00011855363845825195]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 11.0, 11.0, 18.0, 16.0, 30.0, 64.0, 78.0, 168.0, 333.0, 690.0, 1480.0, 4217.0, 16725.0, 162014.0, 745978.0, 98455.0, 12289.0, 3427.0, 1312.0, 516.0, 283.0, 159.0, 94.0, 51.0, 38.0, 29.0, 17.0, 11.0, 9.0, 4.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.177978515625, -0.17192649841308594, -0.16587448120117188, -0.1598224639892578, -0.15377044677734375, -0.1477184295654297, -0.14166641235351562, -0.13561439514160156, -0.1295623779296875, -0.12351036071777344, -0.11745834350585938, -0.11140632629394531, -0.10535430908203125, -0.09930229187011719, -0.09325027465820312, -0.08719825744628906, -0.081146240234375, -0.07509422302246094, -0.06904220581054688, -0.06299018859863281, -0.05693817138671875, -0.05088615417480469, -0.044834136962890625, -0.03878211975097656, -0.0327301025390625, -0.026678085327148438, -0.020626068115234375, -0.014574050903320312, -0.00852203369140625, -0.0024700164794921875, 0.003582000732421875, 0.009634017944335938, 0.01568603515625, 0.021738052368164062, 0.027790069580078125, 0.03384208679199219, 0.03989410400390625, 0.04594612121582031, 0.051998138427734375, 0.05805015563964844, 0.0641021728515625, 0.07015419006347656, 0.07620620727539062, 0.08225822448730469, 0.08831024169921875, 0.09436225891113281, 0.10041427612304688, 0.10646629333496094, 0.112518310546875, 0.11857032775878906, 0.12462234497070312, 0.1306743621826172, 0.13672637939453125, 0.1427783966064453, 0.14883041381835938, 0.15488243103027344, 0.1609344482421875, 0.16698646545410156, 0.17303848266601562, 0.1790904998779297, 0.18514251708984375, 0.1911945343017578, 0.19724655151367188, 0.20329856872558594, 0.2093505859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 15.0, 29.0, 41.0, 89.0, 121.0, 170.0, 171.0, 155.0, 89.0, 50.0, 21.0, 16.0, 4.0, 7.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19970703125, -0.18926239013671875, -0.1788177490234375, -0.16837310791015625, -0.157928466796875, -0.14748382568359375, -0.1370391845703125, -0.12659454345703125, -0.11614990234375, -0.10570526123046875, -0.0952606201171875, -0.08481597900390625, -0.074371337890625, -0.06392669677734375, -0.0534820556640625, -0.04303741455078125, -0.0325927734375, -0.02214813232421875, -0.0117034912109375, -0.00125885009765625, 0.009185791015625, 0.01963043212890625, 0.0300750732421875, 0.04051971435546875, 0.05096435546875, 0.06140899658203125, 0.0718536376953125, 0.08229827880859375, 0.092742919921875, 0.10318756103515625, 0.1136322021484375, 0.12407684326171875, 0.134521484375, 0.14496612548828125, 0.1554107666015625, 0.16585540771484375, 0.176300048828125, 0.18674468994140625, 0.1971893310546875, 0.20763397216796875, 0.21807861328125, 0.22852325439453125, 0.2389678955078125, 0.24941253662109375, 0.259857177734375, 0.27030181884765625, 0.2807464599609375, 0.29119110107421875, 0.3016357421875, 0.31208038330078125, 0.3225250244140625, 0.33296966552734375, 0.343414306640625, 0.35385894775390625, 0.3643035888671875, 0.37474822998046875, 0.38519287109375, 0.39563751220703125, 0.4060821533203125, 0.41652679443359375, 0.426971435546875, 0.43741607666015625, 0.4478607177734375, 0.45830535888671875, 0.46875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 13.0, 20.0, 15.0, 27.0, 42.0, 60.0, 98.0, 138.0, 164.0, 150.0, 116.0, 63.0, 43.0, 19.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9455392360687256, -1.8637481927871704, -1.7819571495056152, -1.7001662254333496, -1.6183751821517944, -1.5365841388702393, -1.4547932147979736, -1.3730021715164185, -1.2912111282348633, -1.209420084953308, -1.127629041671753, -1.0458381175994873, -0.9640470743179321, -0.882256031036377, -0.8004650473594666, -0.7186740636825562, -0.636883020401001, -0.5550919771194458, -0.4733009934425354, -0.3915099799633026, -0.3097189664840698, -0.22792795300483704, -0.14613693952560425, -0.06434595584869385, 0.017445087432861328, 0.09923610091209412, 0.1810271143913269, 0.2628181278705597, 0.3446091413497925, 0.42640015482902527, 0.5081911683082581, 0.5899821519851685, 0.6717734336853027, 0.7535644769668579, 0.8353554606437683, 0.9171464443206787, 0.9989374876022339, 1.080728530883789, 1.1625194549560547, 1.2443104982376099, 1.326101541519165, 1.4078925848007202, 1.4896836280822754, 1.571474552154541, 1.6532655954360962, 1.7350566387176514, 1.816847562789917, 1.8986386060714722, 1.9804296493530273, 2.062220573425293, 2.1440117359161377, 2.2258026599884033, 2.307593822479248, 2.3893847465515137, 2.4711756706237793, 2.552966594696045, 2.6347577571868896, 2.7165486812591553, 2.79833984375, 2.8801307678222656, 2.9619216918945312, 3.043712854385376, 3.1255037784576416, 3.2072949409484863, 3.289085865020752]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 11.0, 2.0, 9.0, 4.0, 13.0, 9.0, 9.0, 16.0, 19.0, 27.0, 27.0, 25.0, 26.0, 42.0, 37.0, 34.0, 53.0, 50.0, 48.0, 52.0, 66.0, 43.0, 33.0, 27.0, 35.0, 31.0, 34.0, 26.0, 28.0, 29.0, 17.0, 18.0, 11.0, 15.0, 16.0, 11.0, 11.0, 5.0, 4.0, 8.0, 10.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.0298027992248535, -2.9452853202819824, -2.8607680797576904, -2.7762506008148193, -2.6917331218719482, -2.607215642929077, -2.522698402404785, -2.438180923461914, -2.353663444519043, -2.269145965576172, -2.18462872505188, -2.100111246109009, -2.0155937671661377, -1.9310764074325562, -1.8465590476989746, -1.7620415687561035, -1.677524209022522, -1.5930068492889404, -1.5084893703460693, -1.4239720106124878, -1.3394545316696167, -1.2549371719360352, -1.170419692993164, -1.0859023332595825, -1.001384973526001, -0.9168675541877747, -0.8323501348495483, -0.7478327751159668, -0.6633152961730957, -0.5787979364395142, -0.49428051710128784, -0.4097630977630615, -0.32524561882019043, -0.2407281994819641, -0.156210795044899, -0.07169339060783386, 0.012824028730392456, 0.09734144806861877, 0.1818588376045227, 0.266376256942749, 0.35089367628097534, 0.43541109561920166, 0.519928514957428, 0.6044459342956543, 0.6889632940292358, 0.7734807729721069, 0.8579981327056885, 0.9425155520439148, 1.0270329713821411, 1.1115503311157227, 1.1960678100585938, 1.2805851697921753, 1.3651026487350464, 1.449620008468628, 1.534137487411499, 1.6186548471450806, 1.703172206878662, 1.7876895666122437, 1.8722070455551147, 1.9567244052886963, 2.0412418842315674, 2.1257593631744385, 2.2102766036987305, 2.2947940826416016, 2.3793115615844727]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 9.0, 15.0, 16.0, 30.0, 46.0, 95.0, 160.0, 292.0, 633.0, 1792.0, 7861.0, 4082732.0, 93825.0, 4436.0, 1244.0, 515.0, 242.0, 132.0, 64.0, 42.0, 23.0, 16.0, 14.0, 11.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67578125, -0.6474456787109375, -0.619110107421875, -0.5907745361328125, -0.56243896484375, -0.5341033935546875, -0.505767822265625, -0.4774322509765625, -0.4490966796875, -0.4207611083984375, -0.392425537109375, -0.3640899658203125, -0.33575439453125, -0.3074188232421875, -0.279083251953125, -0.2507476806640625, -0.222412109375, -0.1940765380859375, -0.165740966796875, -0.1374053955078125, -0.10906982421875, -0.0807342529296875, -0.052398681640625, -0.0240631103515625, 0.0042724609375, 0.0326080322265625, 0.060943603515625, 0.0892791748046875, 0.11761474609375, 0.1459503173828125, 0.174285888671875, 0.2026214599609375, 0.23095703125, 0.2592926025390625, 0.287628173828125, 0.3159637451171875, 0.34429931640625, 0.3726348876953125, 0.400970458984375, 0.4293060302734375, 0.4576416015625, 0.4859771728515625, 0.514312744140625, 0.5426483154296875, 0.57098388671875, 0.5993194580078125, 0.627655029296875, 0.6559906005859375, 0.684326171875, 0.7126617431640625, 0.740997314453125, 0.7693328857421875, 0.79766845703125, 0.8260040283203125, 0.854339599609375, 0.8826751708984375, 0.9110107421875, 0.9393463134765625, 0.967681884765625, 0.9960174560546875, 1.02435302734375, 1.0526885986328125, 1.081024169921875, 1.1093597412109375, 1.1376953125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 10.0, 12.0, 18.0, 16.0, 31.0, 30.0, 33.0, 30.0, 58.0, 58.0, 58.0, 64.0, 49.0, 71.0, 61.0, 68.0, 52.0, 45.0, 44.0, 28.0, 23.0, 25.0, 25.0, 20.0, 10.0, 16.0, 11.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2269287109375, -0.2207965850830078, -0.21466445922851562, -0.20853233337402344, -0.20240020751953125, -0.19626808166503906, -0.19013595581054688, -0.1840038299560547, -0.1778717041015625, -0.1717395782470703, -0.16560745239257812, -0.15947532653808594, -0.15334320068359375, -0.14721107482910156, -0.14107894897460938, -0.1349468231201172, -0.128814697265625, -0.12268257141113281, -0.11655044555664062, -0.11041831970214844, -0.10428619384765625, -0.09815406799316406, -0.09202194213867188, -0.08588981628417969, -0.0797576904296875, -0.07362556457519531, -0.06749343872070312, -0.06136131286621094, -0.05522918701171875, -0.04909706115722656, -0.042964935302734375, -0.03683280944824219, -0.03070068359375, -0.024568557739257812, -0.018436431884765625, -0.012304306030273438, -0.00617218017578125, -4.00543212890625e-05, 0.006092071533203125, 0.012224197387695312, 0.0183563232421875, 0.024488449096679688, 0.030620574951171875, 0.03675270080566406, 0.04288482666015625, 0.04901695251464844, 0.055149078369140625, 0.06128120422363281, 0.067413330078125, 0.07354545593261719, 0.07967758178710938, 0.08580970764160156, 0.09194183349609375, 0.09807395935058594, 0.10420608520507812, 0.11033821105957031, 0.1164703369140625, 0.12260246276855469, 0.12873458862304688, 0.13486671447753906, 0.14099884033203125, 0.14713096618652344, 0.15326309204101562, 0.1593952178955078, 0.16552734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 7.0, 1.0, 5.0, 4.0, 11.0, 13.0, 18.0, 22.0, 24.0, 31.0, 38.0, 54.0, 99.0, 148.0, 239.0, 399.0, 724.0, 1280.0, 2787.0, 7816.0, 50247.0, 4061356.0, 54675.0, 8155.0, 2907.0, 1311.0, 702.0, 389.0, 265.0, 143.0, 100.0, 76.0, 58.0, 41.0, 26.0, 27.0, 19.0, 16.0, 8.0, 7.0, 5.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.429931640625, -0.416290283203125, -0.40264892578125, -0.389007568359375, -0.3753662109375, -0.361724853515625, -0.34808349609375, -0.334442138671875, -0.32080078125, -0.307159423828125, -0.29351806640625, -0.279876708984375, -0.2662353515625, -0.252593994140625, -0.23895263671875, -0.225311279296875, -0.211669921875, -0.198028564453125, -0.18438720703125, -0.170745849609375, -0.1571044921875, -0.143463134765625, -0.12982177734375, -0.116180419921875, -0.1025390625, -0.088897705078125, -0.07525634765625, -0.061614990234375, -0.0479736328125, -0.034332275390625, -0.02069091796875, -0.007049560546875, 0.006591796875, 0.020233154296875, 0.03387451171875, 0.047515869140625, 0.0611572265625, 0.074798583984375, 0.08843994140625, 0.102081298828125, 0.11572265625, 0.129364013671875, 0.14300537109375, 0.156646728515625, 0.1702880859375, 0.183929443359375, 0.19757080078125, 0.211212158203125, 0.224853515625, 0.238494873046875, 0.25213623046875, 0.265777587890625, 0.2794189453125, 0.293060302734375, 0.30670166015625, 0.320343017578125, 0.333984375, 0.347625732421875, 0.36126708984375, 0.374908447265625, 0.3885498046875, 0.402191162109375, 0.41583251953125, 0.429473876953125, 0.443115234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 2.0, 14.0, 25.0, 80.0, 3577.0, 289.0, 49.0, 26.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.26122188568115234, -0.2551097869873047, -0.24899768829345703, -0.24288558959960938, -0.23677349090576172, -0.23066139221191406, -0.2245492935180664, -0.21843719482421875, -0.2123250961303711, -0.20621299743652344, -0.20010089874267578, -0.19398880004882812, -0.18787670135498047, -0.1817646026611328, -0.17565250396728516, -0.1695404052734375, -0.16342830657958984, -0.1573162078857422, -0.15120410919189453, -0.14509201049804688, -0.13897991180419922, -0.13286781311035156, -0.1267557144165039, -0.12064361572265625, -0.1145315170288086, -0.10841941833496094, -0.10230731964111328, -0.09619522094726562, -0.09008312225341797, -0.08397102355957031, -0.07785892486572266, -0.071746826171875, -0.06563472747802734, -0.05952262878417969, -0.05341053009033203, -0.047298431396484375, -0.04118633270263672, -0.03507423400878906, -0.028962135314941406, -0.02285003662109375, -0.016737937927246094, -0.010625839233398438, -0.004513740539550781, 0.001598358154296875, 0.007710456848144531, 0.013822555541992188, 0.019934654235839844, 0.0260467529296875, 0.032158851623535156, 0.03827095031738281, 0.04438304901123047, 0.050495147705078125, 0.05660724639892578, 0.06271934509277344, 0.0688314437866211, 0.07494354248046875, 0.0810556411743164, 0.08716773986816406, 0.09327983856201172, 0.09939193725585938, 0.10550403594970703, 0.11161613464355469, 0.11772823333740234, 0.12384033203125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 20.0, 48.0, 71.0, 124.0, 163.0, 176.0, 147.0, 109.0, 65.0, 34.0, 15.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5215672254562378, -0.508392333984375, -0.495217502117157, -0.4820426106452942, -0.4688677489757538, -0.4556928873062134, -0.4425179958343506, -0.4293431341648102, -0.4161682724952698, -0.40299341082572937, -0.38981854915618896, -0.37664365768432617, -0.36346879601478577, -0.35029393434524536, -0.33711904287338257, -0.32394418120384216, -0.31076931953430176, -0.29759445786476135, -0.28441959619522095, -0.27124470472335815, -0.25806984305381775, -0.24489498138427734, -0.23172010481357574, -0.21854522824287415, -0.20537036657333374, -0.19219550490379333, -0.17902062833309174, -0.16584575176239014, -0.15267089009284973, -0.13949602842330933, -0.12632115185260773, -0.11314628273248672, -0.09997141361236572, -0.08679654449224472, -0.07362167537212372, -0.060446806252002716, -0.047271937131881714, -0.03409706801176071, -0.02092219889163971, -0.007747329771518707, 0.005427539348602295, 0.018602408468723297, 0.0317772775888443, 0.0449521467089653, 0.058127015829086304, 0.0713018849492073, 0.08447675406932831, 0.09765162318944931, 0.11082649230957031, 0.12400136142969131, 0.13717623054981232, 0.15035110712051392, 0.16352596879005432, 0.17670083045959473, 0.18987570703029633, 0.20305058360099792, 0.21622544527053833, 0.22940030694007874, 0.24257518351078033, 0.25575006008148193, 0.26892492175102234, 0.28209978342056274, 0.29527467489242554, 0.30844953656196594, 0.32162439823150635]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 6.0, 11.0, 10.0, 16.0, 12.0, 26.0, 18.0, 21.0, 24.0, 23.0, 37.0, 41.0, 43.0, 43.0, 42.0, 40.0, 52.0, 46.0, 51.0, 49.0, 50.0, 42.0, 38.0, 45.0, 30.0, 28.0, 30.0, 28.0, 16.0, 19.0, 12.0, 12.0, 9.0, 5.0, 1.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22378134727478027, -0.21661347150802612, -0.20944559574127197, -0.20227771997451782, -0.19510984420776367, -0.18794196844100952, -0.18077409267425537, -0.17360621690750122, -0.16643834114074707, -0.15927046537399292, -0.15210258960723877, -0.14493471384048462, -0.13776683807373047, -0.13059896230697632, -0.12343109399080276, -0.11626321822404861, -0.10909534990787506, -0.10192747414112091, -0.09475959837436676, -0.08759172260761261, -0.08042384684085846, -0.07325597107410431, -0.06608810275793076, -0.058920226991176605, -0.051752351224422455, -0.044584475457668304, -0.037416599690914154, -0.030248727649450302, -0.02308085188269615, -0.015912976115942, -0.00874510407447815, -0.001577228307723999, 0.005590647459030151, 0.012758522294461727, 0.019926397129893303, 0.027094271034002304, 0.034262146800756454, 0.041430022567510605, 0.04859789460897446, 0.05576577037572861, 0.06293364614248276, 0.07010152190923691, 0.07726939767599106, 0.08443726599216461, 0.09160514175891876, 0.09877301752567291, 0.10594089329242706, 0.11310876905918121, 0.12027664482593536, 0.12744452059268951, 0.13461239635944366, 0.14178027212619781, 0.14894814789295197, 0.15611602365970612, 0.16328388452529907, 0.17045176029205322, 0.17761963605880737, 0.18478751182556152, 0.19195538759231567, 0.19912326335906982, 0.20629113912582397, 0.21345901489257812, 0.22062689065933228, 0.22779476642608643, 0.23496264219284058]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 16.0, 16.0, 26.0, 41.0, 63.0, 114.0, 187.0, 332.0, 721.0, 1794.0, 5629.0, 26799.0, 197356.0, 629659.0, 155930.0, 21931.0, 4942.0, 1533.0, 637.0, 340.0, 190.0, 96.0, 69.0, 44.0, 21.0, 22.0, 15.0, 6.0, 3.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291015625, -0.27860260009765625, -0.2661895751953125, -0.25377655029296875, -0.241363525390625, -0.22895050048828125, -0.2165374755859375, -0.20412445068359375, -0.19171142578125, -0.17929840087890625, -0.1668853759765625, -0.15447235107421875, -0.142059326171875, -0.12964630126953125, -0.1172332763671875, -0.10482025146484375, -0.0924072265625, -0.07999420166015625, -0.0675811767578125, -0.05516815185546875, -0.042755126953125, -0.03034210205078125, -0.0179290771484375, -0.00551605224609375, 0.00689697265625, 0.01930999755859375, 0.0317230224609375, 0.04413604736328125, 0.056549072265625, 0.06896209716796875, 0.0813751220703125, 0.09378814697265625, 0.106201171875, 0.11861419677734375, 0.1310272216796875, 0.14344024658203125, 0.155853271484375, 0.16826629638671875, 0.1806793212890625, 0.19309234619140625, 0.20550537109375, 0.21791839599609375, 0.2303314208984375, 0.24274444580078125, 0.255157470703125, 0.26757049560546875, 0.2799835205078125, 0.29239654541015625, 0.3048095703125, 0.31722259521484375, 0.3296356201171875, 0.34204864501953125, 0.354461669921875, 0.36687469482421875, 0.3792877197265625, 0.39170074462890625, 0.40411376953125, 0.41652679443359375, 0.4289398193359375, 0.44135284423828125, 0.453765869140625, 0.46617889404296875, 0.4785919189453125, 0.49100494384765625, 0.50341796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 9.0, 14.0, 14.0, 17.0, 23.0, 34.0, 30.0, 43.0, 34.0, 47.0, 47.0, 62.0, 58.0, 62.0, 76.0, 68.0, 50.0, 47.0, 39.0, 39.0, 33.0, 22.0, 24.0, 26.0, 16.0, 15.0, 13.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.22509765625, -0.21892738342285156, -0.21275711059570312, -0.2065868377685547, -0.20041656494140625, -0.1942462921142578, -0.18807601928710938, -0.18190574645996094, -0.1757354736328125, -0.16956520080566406, -0.16339492797851562, -0.1572246551513672, -0.15105438232421875, -0.1448841094970703, -0.13871383666992188, -0.13254356384277344, -0.126373291015625, -0.12020301818847656, -0.11403274536132812, -0.10786247253417969, -0.10169219970703125, -0.09552192687988281, -0.08935165405273438, -0.08318138122558594, -0.0770111083984375, -0.07084083557128906, -0.06467056274414062, -0.05850028991699219, -0.05233001708984375, -0.04615974426269531, -0.039989471435546875, -0.03381919860839844, -0.02764892578125, -0.021478652954101562, -0.015308380126953125, -0.009138107299804688, -0.00296783447265625, 0.0032024383544921875, 0.009372711181640625, 0.015542984008789062, 0.0217132568359375, 0.027883529663085938, 0.034053802490234375, 0.04022407531738281, 0.04639434814453125, 0.05256462097167969, 0.058734893798828125, 0.06490516662597656, 0.071075439453125, 0.07724571228027344, 0.08341598510742188, 0.08958625793457031, 0.09575653076171875, 0.10192680358886719, 0.10809707641601562, 0.11426734924316406, 0.1204376220703125, 0.12660789489746094, 0.13277816772460938, 0.1389484405517578, 0.14511871337890625, 0.1512889862060547, 0.15745925903320312, 0.16362953186035156, 0.1697998046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 6.0, 12.0, 13.0, 24.0, 27.0, 45.0, 87.0, 142.0, 257.0, 412.0, 932.0, 2305.0, 7677.0, 80388.0, 859631.0, 84587.0, 7812.0, 2300.0, 890.0, 433.0, 226.0, 124.0, 83.0, 47.0, 25.0, 13.0, 21.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5278701782226562, -0.5093536376953125, -0.49083709716796875, -0.472320556640625, -0.45380401611328125, -0.4352874755859375, -0.41677093505859375, -0.39825439453125, -0.37973785400390625, -0.3612213134765625, -0.34270477294921875, -0.324188232421875, -0.30567169189453125, -0.2871551513671875, -0.26863861083984375, -0.2501220703125, -0.23160552978515625, -0.2130889892578125, -0.19457244873046875, -0.176055908203125, -0.15753936767578125, -0.1390228271484375, -0.12050628662109375, -0.10198974609375, -0.08347320556640625, -0.0649566650390625, -0.04644012451171875, -0.027923583984375, -0.00940704345703125, 0.0091094970703125, 0.02762603759765625, 0.046142578125, 0.06465911865234375, 0.0831756591796875, 0.10169219970703125, 0.120208740234375, 0.13872528076171875, 0.1572418212890625, 0.17575836181640625, 0.19427490234375, 0.21279144287109375, 0.2313079833984375, 0.24982452392578125, 0.268341064453125, 0.28685760498046875, 0.3053741455078125, 0.32389068603515625, 0.3424072265625, 0.36092376708984375, 0.3794403076171875, 0.39795684814453125, 0.416473388671875, 0.43498992919921875, 0.4535064697265625, 0.47202301025390625, 0.49053955078125, 0.5090560913085938, 0.5275726318359375, 0.5460891723632812, 0.564605712890625, 0.5831222534179688, 0.6016387939453125, 0.6201553344726562, 0.638671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 16.0, 17.0, 16.0, 45.0, 62.0, 73.0, 107.0, 126.0, 95.0, 96.0, 97.0, 81.0, 71.0, 42.0, 13.0, 13.0, 6.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2679290771484375, -1.216522216796875, -1.1651153564453125, -1.11370849609375, -1.0623016357421875, -1.010894775390625, -0.9594879150390625, -0.9080810546875, -0.8566741943359375, -0.805267333984375, -0.7538604736328125, -0.70245361328125, -0.6510467529296875, -0.599639892578125, -0.5482330322265625, -0.496826171875, -0.4454193115234375, -0.394012451171875, -0.3426055908203125, -0.29119873046875, -0.2397918701171875, -0.188385009765625, -0.1369781494140625, -0.0855712890625, -0.0341644287109375, 0.017242431640625, 0.0686492919921875, 0.12005615234375, 0.1714630126953125, 0.222869873046875, 0.2742767333984375, 0.32568359375, 0.3770904541015625, 0.428497314453125, 0.4799041748046875, 0.53131103515625, 0.5827178955078125, 0.634124755859375, 0.6855316162109375, 0.7369384765625, 0.7883453369140625, 0.839752197265625, 0.8911590576171875, 0.94256591796875, 0.9939727783203125, 1.045379638671875, 1.0967864990234375, 1.148193359375, 1.1996002197265625, 1.251007080078125, 1.3024139404296875, 1.35382080078125, 1.4052276611328125, 1.456634521484375, 1.5080413818359375, 1.5594482421875, 1.6108551025390625, 1.662261962890625, 1.7136688232421875, 1.76507568359375, 1.8164825439453125, 1.867889404296875, 1.9192962646484375, 1.970703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 9.0, 10.0, 33.0, 44.0, 199.0, 1083.0, 972378.0, 73845.0, 696.0, 157.0, 52.0, 15.0, 9.0, 12.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -0.982269287109375, -0.92742919921875, -0.872589111328125, -0.8177490234375, -0.762908935546875, -0.70806884765625, -0.653228759765625, -0.598388671875, -0.543548583984375, -0.48870849609375, -0.433868408203125, -0.3790283203125, -0.324188232421875, -0.26934814453125, -0.214508056640625, -0.15966796875, -0.104827880859375, -0.04998779296875, 0.004852294921875, 0.0596923828125, 0.114532470703125, 0.16937255859375, 0.224212646484375, 0.279052734375, 0.333892822265625, 0.38873291015625, 0.443572998046875, 0.4984130859375, 0.553253173828125, 0.60809326171875, 0.662933349609375, 0.7177734375, 0.772613525390625, 0.82745361328125, 0.882293701171875, 0.9371337890625, 0.991973876953125, 1.04681396484375, 1.101654052734375, 1.156494140625, 1.211334228515625, 1.26617431640625, 1.321014404296875, 1.3758544921875, 1.430694580078125, 1.48553466796875, 1.540374755859375, 1.59521484375, 1.650054931640625, 1.70489501953125, 1.759735107421875, 1.8145751953125, 1.869415283203125, 1.92425537109375, 1.979095458984375, 2.033935546875, 2.088775634765625, 2.14361572265625, 2.198455810546875, 2.2532958984375, 2.308135986328125, 2.36297607421875, 2.417816162109375, 2.47265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 6.0, 6.0, 14.0, 16.0, 19.0, 25.0, 30.0, 44.0, 48.0, 75.0, 76.0, 101.0, 79.0, 92.0, 70.0, 67.0, 53.0, 21.0, 29.0, 27.0, 21.0, 13.0, 11.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.368492126464844e-05, -8.103344589471817e-05, -7.83819705247879e-05, -7.573049515485764e-05, -7.307901978492737e-05, -7.04275444149971e-05, -6.777606904506683e-05, -6.512459367513657e-05, -6.24731183052063e-05, -5.982164293527603e-05, -5.7170167565345764e-05, -5.45186921954155e-05, -5.186721682548523e-05, -4.921574145555496e-05, -4.6564266085624695e-05, -4.391279071569443e-05, -4.126131534576416e-05, -3.860983997583389e-05, -3.5958364605903625e-05, -3.330688923597336e-05, -3.065541386604309e-05, -2.8003938496112823e-05, -2.5352463126182556e-05, -2.270098775625229e-05, -2.004951238632202e-05, -1.7398037016391754e-05, -1.4746561646461487e-05, -1.209508627653122e-05, -9.443610906600952e-06, -6.792135536670685e-06, -4.1406601667404175e-06, -1.4891847968101501e-06, 1.1622905731201172e-06, 3.8137659430503845e-06, 6.465241312980652e-06, 9.11671668291092e-06, 1.1768192052841187e-05, 1.4419667422771454e-05, 1.707114279270172e-05, 1.972261816263199e-05, 2.2374093532562256e-05, 2.5025568902492523e-05, 2.767704427242279e-05, 3.0328519642353058e-05, 3.2979995012283325e-05, 3.563147038221359e-05, 3.828294575214386e-05, 4.093442112207413e-05, 4.3585896492004395e-05, 4.623737186193466e-05, 4.888884723186493e-05, 5.1540322601795197e-05, 5.4191797971725464e-05, 5.684327334165573e-05, 5.9494748711586e-05, 6.214622408151627e-05, 6.479769945144653e-05, 6.74491748213768e-05, 7.010065019130707e-05, 7.275212556123734e-05, 7.54036009311676e-05, 7.805507630109787e-05, 8.070655167102814e-05, 8.33580270409584e-05, 8.600950241088867e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 15.0, 35.0, 42.0, 92.0, 184.0, 411.0, 1606.0, 14714.0, 1006623.0, 22033.0, 1913.0, 473.0, 172.0, 99.0, 51.0, 28.0, 18.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.6323318481445312, -0.6093902587890625, -0.5864486694335938, -0.563507080078125, -0.5405654907226562, -0.5176239013671875, -0.49468231201171875, -0.47174072265625, -0.44879913330078125, -0.4258575439453125, -0.40291595458984375, -0.379974365234375, -0.35703277587890625, -0.3340911865234375, -0.31114959716796875, -0.2882080078125, -0.26526641845703125, -0.2423248291015625, -0.21938323974609375, -0.196441650390625, -0.17350006103515625, -0.1505584716796875, -0.12761688232421875, -0.10467529296875, -0.08173370361328125, -0.0587921142578125, -0.03585052490234375, -0.012908935546875, 0.01003265380859375, 0.0329742431640625, 0.05591583251953125, 0.078857421875, 0.10179901123046875, 0.1247406005859375, 0.14768218994140625, 0.170623779296875, 0.19356536865234375, 0.2165069580078125, 0.23944854736328125, 0.26239013671875, 0.28533172607421875, 0.3082733154296875, 0.33121490478515625, 0.354156494140625, 0.37709808349609375, 0.4000396728515625, 0.42298126220703125, 0.4459228515625, 0.46886444091796875, 0.4918060302734375, 0.5147476196289062, 0.537689208984375, 0.5606307983398438, 0.5835723876953125, 0.6065139770507812, 0.62945556640625, 0.6523971557617188, 0.6753387451171875, 0.6982803344726562, 0.721221923828125, 0.7441635131835938, 0.7671051025390625, 0.7900466918945312, 0.81298828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 6.0, 9.0, 18.0, 117.0, 447.0, 318.0, 51.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5386962890625, -1.505126953125, -1.4715576171875, -1.43798828125, -1.4044189453125, -1.370849609375, -1.3372802734375, -1.3037109375, -1.2701416015625, -1.236572265625, -1.2030029296875, -1.16943359375, -1.1358642578125, -1.102294921875, -1.0687255859375, -1.03515625, -1.0015869140625, -0.968017578125, -0.9344482421875, -0.90087890625, -0.8673095703125, -0.833740234375, -0.8001708984375, -0.7666015625, -0.7330322265625, -0.699462890625, -0.6658935546875, -0.63232421875, -0.5987548828125, -0.565185546875, -0.5316162109375, -0.498046875, -0.4644775390625, -0.430908203125, -0.3973388671875, -0.36376953125, -0.3302001953125, -0.296630859375, -0.2630615234375, -0.2294921875, -0.1959228515625, -0.162353515625, -0.1287841796875, -0.09521484375, -0.0616455078125, -0.028076171875, 0.0054931640625, 0.0390625, 0.0726318359375, 0.106201171875, 0.1397705078125, 0.17333984375, 0.2069091796875, 0.240478515625, 0.2740478515625, 0.3076171875, 0.3411865234375, 0.374755859375, 0.4083251953125, 0.44189453125, 0.4754638671875, 0.509033203125, 0.5426025390625, 0.576171875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 19.0, 41.0, 177.0, 535.0, 190.0, 20.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.39830780029297, -21.948360443115234, -21.4984130859375, -21.0484676361084, -20.598520278930664, -20.14857292175293, -19.698625564575195, -19.248680114746094, -18.79873275756836, -18.348785400390625, -17.89883804321289, -17.44889259338379, -16.998945236206055, -16.54899787902832, -16.099050521850586, -15.649104118347168, -15.199156761169434, -14.7492094039917, -14.299263000488281, -13.849315643310547, -13.399369239807129, -12.949421882629395, -12.499475479125977, -12.049528121948242, -11.599580764770508, -11.149633407592773, -10.699687004089355, -10.249739646911621, -9.799793243408203, -9.349845886230469, -8.899898529052734, -8.449952125549316, -8.000005722045898, -7.550058841705322, -7.100111961364746, -6.650164604187012, -6.200218200683594, -5.750270843505859, -5.300323963165283, -4.850377082824707, -4.400430202484131, -3.9504833221435547, -3.5005364418029785, -3.0505893230438232, -2.600642442703247, -2.150695562362671, -1.7007484436035156, -1.2508015632629395, -0.8008546829223633, -0.35090774297714233, 0.09903919696807861, 0.5489861965179443, 0.9989330768585205, 1.4488799571990967, 1.898827075958252, 2.348773956298828, 2.7987208366394043, 3.2486677169799805, 3.6986145973205566, 4.148561477661133, 4.598508834838867, 5.048455238342285, 5.4984025955200195, 5.948349475860596, 6.398296356201172]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 9.0, 7.0, 6.0, 12.0, 8.0, 17.0, 17.0, 16.0, 20.0, 23.0, 26.0, 28.0, 32.0, 32.0, 37.0, 42.0, 44.0, 53.0, 45.0, 45.0, 53.0, 43.0, 42.0, 31.0, 37.0, 26.0, 29.0, 38.0, 29.0, 22.0, 25.0, 16.0, 13.0, 11.0, 11.0, 13.0, 15.0, 2.0, 1.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.7863407135009766, -3.668015480041504, -3.5496902465820312, -3.4313650131225586, -3.313039779663086, -3.1947145462036133, -3.0763893127441406, -2.958064079284668, -2.8397388458251953, -2.7214136123657227, -2.60308837890625, -2.4847631454467773, -2.3664379119873047, -2.248112678527832, -2.1297874450683594, -2.0114622116088867, -1.8931372165679932, -1.7748119831085205, -1.6564867496490479, -1.5381615161895752, -1.4198362827301025, -1.3015110492706299, -1.1831859350204468, -1.0648607015609741, -0.9465354681015015, -0.8282102346420288, -0.7098850011825562, -0.5915598273277283, -0.4732345938682556, -0.35490936040878296, -0.23658418655395508, -0.11825895309448242, 6.604194641113281e-05, 0.1183912605047226, 0.23671647906303406, 0.3550416827201843, 0.473366916179657, 0.5916921496391296, 0.7100173234939575, 0.8283425569534302, 0.9466677904129028, 1.0649930238723755, 1.1833182573318481, 1.3016433715820312, 1.419968605041504, 1.5382938385009766, 1.6566190719604492, 1.7749443054199219, 1.8932695388793945, 2.011594772338867, 2.12992000579834, 2.2482452392578125, 2.366570472717285, 2.484895706176758, 2.6032209396362305, 2.721546173095703, 2.839871406555176, 2.9581966400146484, 3.076521873474121, 3.1948471069335938, 3.3131723403930664, 3.431497573852539, 3.5498228073120117, 3.6681480407714844, 3.786473035812378]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 14.0, 21.0, 46.0, 84.0, 194.0, 534.0, 1476.0, 8628.0, 4133710.0, 45410.0, 2831.0, 779.0, 285.0, 120.0, 53.0, 32.0, 22.0, 17.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.83453369140625, -0.8082275390625, -0.78192138671875, -0.755615234375, -0.72930908203125, -0.7030029296875, -0.67669677734375, -0.650390625, -0.62408447265625, -0.5977783203125, -0.57147216796875, -0.545166015625, -0.51885986328125, -0.4925537109375, -0.46624755859375, -0.43994140625, -0.41363525390625, -0.3873291015625, -0.36102294921875, -0.334716796875, -0.30841064453125, -0.2821044921875, -0.25579833984375, -0.2294921875, -0.20318603515625, -0.1768798828125, -0.15057373046875, -0.124267578125, -0.09796142578125, -0.0716552734375, -0.04534912109375, -0.01904296875, 0.00726318359375, 0.0335693359375, 0.05987548828125, 0.086181640625, 0.11248779296875, 0.1387939453125, 0.16510009765625, 0.19140625, 0.21771240234375, 0.2440185546875, 0.27032470703125, 0.296630859375, 0.32293701171875, 0.3492431640625, 0.37554931640625, 0.40185546875, 0.42816162109375, 0.4544677734375, 0.48077392578125, 0.507080078125, 0.53338623046875, 0.5596923828125, 0.58599853515625, 0.6123046875, 0.63861083984375, 0.6649169921875, 0.69122314453125, 0.717529296875, 0.74383544921875, 0.7701416015625, 0.79644775390625, 0.82275390625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 2.0, 11.0, 11.0, 12.0, 10.0, 17.0, 24.0, 24.0, 25.0, 25.0, 37.0, 49.0, 41.0, 44.0, 61.0, 51.0, 65.0, 68.0, 57.0, 67.0, 45.0, 46.0, 30.0, 28.0, 27.0, 19.0, 16.0, 7.0, 13.0, 6.0, 7.0, 11.0, 5.0, 6.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.229248046875, -0.22238922119140625, -0.2155303955078125, -0.20867156982421875, -0.201812744140625, -0.19495391845703125, -0.1880950927734375, -0.18123626708984375, -0.17437744140625, -0.16751861572265625, -0.1606597900390625, -0.15380096435546875, -0.146942138671875, -0.14008331298828125, -0.1332244873046875, -0.12636566162109375, -0.1195068359375, -0.11264801025390625, -0.1057891845703125, -0.09893035888671875, -0.092071533203125, -0.08521270751953125, -0.0783538818359375, -0.07149505615234375, -0.06463623046875, -0.05777740478515625, -0.0509185791015625, -0.04405975341796875, -0.037200927734375, -0.03034210205078125, -0.0234832763671875, -0.01662445068359375, -0.009765625, -0.00290679931640625, 0.0039520263671875, 0.01081085205078125, 0.017669677734375, 0.02452850341796875, 0.0313873291015625, 0.03824615478515625, 0.04510498046875, 0.05196380615234375, 0.0588226318359375, 0.06568145751953125, 0.072540283203125, 0.07939910888671875, 0.0862579345703125, 0.09311676025390625, 0.0999755859375, 0.10683441162109375, 0.1136932373046875, 0.12055206298828125, 0.127410888671875, 0.13426971435546875, 0.1411285400390625, 0.14798736572265625, 0.15484619140625, 0.16170501708984375, 0.1685638427734375, 0.17542266845703125, 0.182281494140625, 0.18914031982421875, 0.1959991455078125, 0.20285797119140625, 0.209716796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 11.0, 19.0, 17.0, 18.0, 33.0, 56.0, 47.0, 68.0, 148.0, 370.0, 1227.0, 11815.0, 4168553.0, 9954.0, 1180.0, 357.0, 113.0, 54.0, 44.0, 51.0, 36.0, 24.0, 18.0, 24.0, 13.0, 9.0, 2.0, 6.0, 1.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.537109375, -1.494964599609375, -1.45281982421875, -1.410675048828125, -1.3685302734375, -1.326385498046875, -1.28424072265625, -1.242095947265625, -1.199951171875, -1.157806396484375, -1.11566162109375, -1.073516845703125, -1.0313720703125, -0.989227294921875, -0.94708251953125, -0.904937744140625, -0.86279296875, -0.820648193359375, -0.77850341796875, -0.736358642578125, -0.6942138671875, -0.652069091796875, -0.60992431640625, -0.567779541015625, -0.525634765625, -0.483489990234375, -0.44134521484375, -0.399200439453125, -0.3570556640625, -0.314910888671875, -0.27276611328125, -0.230621337890625, -0.1884765625, -0.146331787109375, -0.10418701171875, -0.062042236328125, -0.0198974609375, 0.022247314453125, 0.06439208984375, 0.106536865234375, 0.148681640625, 0.190826416015625, 0.23297119140625, 0.275115966796875, 0.3172607421875, 0.359405517578125, 0.40155029296875, 0.443695068359375, 0.48583984375, 0.527984619140625, 0.57012939453125, 0.612274169921875, 0.6544189453125, 0.696563720703125, 0.73870849609375, 0.780853271484375, 0.822998046875, 0.865142822265625, 0.90728759765625, 0.949432373046875, 0.9915771484375, 1.033721923828125, 1.07586669921875, 1.118011474609375, 1.16015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 27.0, 3703.0, 302.0, 34.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1875, -0.175689697265625, -0.16387939453125, -0.152069091796875, -0.1402587890625, -0.128448486328125, -0.11663818359375, -0.104827880859375, -0.093017578125, -0.081207275390625, -0.06939697265625, -0.057586669921875, -0.0457763671875, -0.033966064453125, -0.02215576171875, -0.010345458984375, 0.00146484375, 0.013275146484375, 0.02508544921875, 0.036895751953125, 0.0487060546875, 0.060516357421875, 0.07232666015625, 0.084136962890625, 0.095947265625, 0.107757568359375, 0.11956787109375, 0.131378173828125, 0.1431884765625, 0.154998779296875, 0.16680908203125, 0.178619384765625, 0.1904296875, 0.202239990234375, 0.21405029296875, 0.225860595703125, 0.2376708984375, 0.249481201171875, 0.26129150390625, 0.273101806640625, 0.284912109375, 0.296722412109375, 0.30853271484375, 0.320343017578125, 0.3321533203125, 0.343963623046875, 0.35577392578125, 0.367584228515625, 0.37939453125, 0.391204833984375, 0.40301513671875, 0.414825439453125, 0.4266357421875, 0.438446044921875, 0.45025634765625, 0.462066650390625, 0.473876953125, 0.485687255859375, 0.49749755859375, 0.509307861328125, 0.5211181640625, 0.532928466796875, 0.54473876953125, 0.556549072265625, 0.568359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 24.0, 291.0, 522.0, 127.0, 21.0, 9.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3711837530136108, -1.3162442445755005, -1.2613046169281006, -1.2063651084899902, -1.1514256000518799, -1.09648597240448, -1.0415464639663696, -0.9866068959236145, -0.9316673278808594, -0.8767277598381042, -0.8217881917953491, -0.7668486833572388, -0.7119091153144836, -0.6569695472717285, -0.6020300388336182, -0.547090470790863, -0.4921509027481079, -0.4372113347053528, -0.38227179646492004, -0.3273322582244873, -0.2723926901817322, -0.21745312213897705, -0.1625135838985443, -0.10757404565811157, -0.052634477615356445, 0.002305075526237488, 0.05724462866783142, 0.11218418180942535, 0.1671237349510193, 0.22206330299377441, 0.27700284123420715, 0.3319423794746399, 0.38688182830810547, 0.4418213963508606, 0.49676093459129333, 0.5517004728317261, 0.6066400408744812, 0.6615796089172363, 0.7165191173553467, 0.7714586853981018, 0.8263982534408569, 0.8813378214836121, 0.9362773895263672, 0.9912168979644775, 1.046156406402588, 1.1010960340499878, 1.1560355424880981, 1.210975170135498, 1.2659146785736084, 1.3208541870117188, 1.3757938146591187, 1.430733323097229, 1.485672950744629, 1.5406124591827393, 1.5955519676208496, 1.65049147605896, 1.7054311037063599, 1.7603706121444702, 1.8153102397918701, 1.8702497482299805, 1.9251892566680908, 1.9801288843154907, 2.0350685119628906, 2.090008020401001, 2.1449475288391113]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 12.0, 11.0, 16.0, 23.0, 26.0, 32.0, 33.0, 39.0, 54.0, 49.0, 64.0, 57.0, 53.0, 52.0, 49.0, 51.0, 67.0, 47.0, 48.0, 44.0, 44.0, 31.0, 19.0, 18.0, 15.0, 15.0, 6.0, 8.0, 1.0, 5.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4719772934913635, -0.45801466703414917, -0.4440520107746124, -0.43008938431739807, -0.41612672805786133, -0.402164101600647, -0.3882014751434326, -0.3742388188838959, -0.36027616262435913, -0.3463135361671448, -0.33235087990760803, -0.3183882534503937, -0.30442559719085693, -0.2904629707336426, -0.2765003442764282, -0.2625376880168915, -0.24857506155967712, -0.23461242020130157, -0.22064977884292603, -0.20668715238571167, -0.19272449612617493, -0.17876186966896057, -0.16479922831058502, -0.15083658695220947, -0.13687394559383392, -0.12291130423545837, -0.10894866287708282, -0.09498602896928787, -0.08102338761091232, -0.06706074625253677, -0.05309811234474182, -0.03913547098636627, -0.025172829627990723, -0.011210190132260323, 0.0027524493634700775, 0.01671508699655533, 0.030677728354930878, 0.04464036971330643, 0.05860300362110138, 0.07256564497947693, 0.08652828633785248, 0.10049092769622803, 0.11445356905460358, 0.12841621041297913, 0.14237883687019348, 0.15634149312973022, 0.17030411958694458, 0.18426676094532013, 0.19822940230369568, 0.21219204366207123, 0.22615468502044678, 0.24011731147766113, 0.2540799677371979, 0.26804259419441223, 0.282005250453949, 0.29596787691116333, 0.3099305033683777, 0.32389312982559204, 0.3378557860851288, 0.35181841254234314, 0.3657810688018799, 0.37974369525909424, 0.3937063217163086, 0.40766897797584534, 0.4216316342353821]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 13.0, 12.0, 23.0, 48.0, 59.0, 96.0, 188.0, 267.0, 377.0, 663.0, 1289.0, 2434.0, 4851.0, 10532.0, 25230.0, 69480.0, 214143.0, 404117.0, 203894.0, 66562.0, 24173.0, 10021.0, 4692.0, 2323.0, 1202.0, 733.0, 419.0, 226.0, 155.0, 108.0, 61.0, 49.0, 26.0, 27.0, 14.0, 11.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23779296875, -0.23069000244140625, -0.2235870361328125, -0.21648406982421875, -0.209381103515625, -0.20227813720703125, -0.1951751708984375, -0.18807220458984375, -0.18096923828125, -0.17386627197265625, -0.1667633056640625, -0.15966033935546875, -0.152557373046875, -0.14545440673828125, -0.1383514404296875, -0.13124847412109375, -0.1241455078125, -0.11704254150390625, -0.1099395751953125, -0.10283660888671875, -0.095733642578125, -0.08863067626953125, -0.0815277099609375, -0.07442474365234375, -0.06732177734375, -0.06021881103515625, -0.0531158447265625, -0.04601287841796875, -0.038909912109375, -0.03180694580078125, -0.0247039794921875, -0.01760101318359375, -0.010498046875, -0.00339508056640625, 0.0037078857421875, 0.01081085205078125, 0.017913818359375, 0.02501678466796875, 0.0321197509765625, 0.03922271728515625, 0.04632568359375, 0.05342864990234375, 0.0605316162109375, 0.06763458251953125, 0.074737548828125, 0.08184051513671875, 0.0889434814453125, 0.09604644775390625, 0.1031494140625, 0.11025238037109375, 0.1173553466796875, 0.12445831298828125, 0.131561279296875, 0.13866424560546875, 0.1457672119140625, 0.15287017822265625, 0.15997314453125, 0.16707611083984375, 0.1741790771484375, 0.18128204345703125, 0.188385009765625, 0.19548797607421875, 0.2025909423828125, 0.20969390869140625, 0.216796875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 5.0, 9.0, 6.0, 12.0, 12.0, 15.0, 22.0, 22.0, 28.0, 31.0, 40.0, 42.0, 55.0, 43.0, 41.0, 57.0, 67.0, 66.0, 61.0, 54.0, 45.0, 40.0, 38.0, 40.0, 32.0, 25.0, 12.0, 10.0, 14.0, 13.0, 7.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23095703125, -0.22406387329101562, -0.21717071533203125, -0.21027755737304688, -0.2033843994140625, -0.19649124145507812, -0.18959808349609375, -0.18270492553710938, -0.175811767578125, -0.16891860961914062, -0.16202545166015625, -0.15513229370117188, -0.1482391357421875, -0.14134597778320312, -0.13445281982421875, -0.12755966186523438, -0.12066650390625, -0.11377334594726562, -0.10688018798828125, -0.09998703002929688, -0.0930938720703125, -0.08620071411132812, -0.07930755615234375, -0.07241439819335938, -0.065521240234375, -0.058628082275390625, -0.05173492431640625, -0.044841766357421875, -0.0379486083984375, -0.031055450439453125, -0.02416229248046875, -0.017269134521484375, -0.0103759765625, -0.003482818603515625, 0.00341033935546875, 0.010303497314453125, 0.0171966552734375, 0.024089813232421875, 0.03098297119140625, 0.037876129150390625, 0.044769287109375, 0.051662445068359375, 0.05855560302734375, 0.06544876098632812, 0.0723419189453125, 0.07923507690429688, 0.08612823486328125, 0.09302139282226562, 0.09991455078125, 0.10680770874023438, 0.11370086669921875, 0.12059402465820312, 0.1274871826171875, 0.13438034057617188, 0.14127349853515625, 0.14816665649414062, 0.155059814453125, 0.16195297241210938, 0.16884613037109375, 0.17573928833007812, 0.1826324462890625, 0.18952560424804688, 0.19641876220703125, 0.20331192016601562, 0.210205078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 5.0, 10.0, 11.0, 12.0, 25.0, 20.0, 29.0, 39.0, 49.0, 82.0, 103.0, 153.0, 203.0, 325.0, 550.0, 952.0, 1935.0, 5508.0, 23968.0, 221918.0, 693507.0, 79996.0, 12216.0, 3496.0, 1405.0, 732.0, 417.0, 291.0, 176.0, 105.0, 83.0, 40.0, 52.0, 35.0, 29.0, 18.0, 16.0, 13.0, 2.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.42333984375, -0.40981292724609375, -0.3962860107421875, -0.38275909423828125, -0.369232177734375, -0.35570526123046875, -0.3421783447265625, -0.32865142822265625, -0.31512451171875, -0.30159759521484375, -0.2880706787109375, -0.27454376220703125, -0.261016845703125, -0.24748992919921875, -0.2339630126953125, -0.22043609619140625, -0.2069091796875, -0.19338226318359375, -0.1798553466796875, -0.16632843017578125, -0.152801513671875, -0.13927459716796875, -0.1257476806640625, -0.11222076416015625, -0.09869384765625, -0.08516693115234375, -0.0716400146484375, -0.05811309814453125, -0.044586181640625, -0.03105926513671875, -0.0175323486328125, -0.00400543212890625, 0.009521484375, 0.02304840087890625, 0.0365753173828125, 0.05010223388671875, 0.063629150390625, 0.07715606689453125, 0.0906829833984375, 0.10420989990234375, 0.11773681640625, 0.13126373291015625, 0.1447906494140625, 0.15831756591796875, 0.171844482421875, 0.18537139892578125, 0.1988983154296875, 0.21242523193359375, 0.2259521484375, 0.23947906494140625, 0.2530059814453125, 0.26653289794921875, 0.280059814453125, 0.29358673095703125, 0.3071136474609375, 0.32064056396484375, 0.33416748046875, 0.34769439697265625, 0.3612213134765625, 0.37474822998046875, 0.388275146484375, 0.40180206298828125, 0.4153289794921875, 0.42885589599609375, 0.4423828125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 13.0, 7.0, 14.0, 20.0, 14.0, 24.0, 26.0, 26.0, 28.0, 41.0, 38.0, 42.0, 43.0, 55.0, 47.0, 53.0, 41.0, 54.0, 37.0, 42.0, 31.0, 39.0, 39.0, 29.0, 28.0, 31.0, 24.0, 14.0, 18.0, 12.0, 9.0, 11.0, 3.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.994140625, -0.9647750854492188, -0.9354095458984375, -0.9060440063476562, -0.876678466796875, -0.8473129272460938, -0.8179473876953125, -0.7885818481445312, -0.75921630859375, -0.7298507690429688, -0.7004852294921875, -0.6711196899414062, -0.641754150390625, -0.6123886108398438, -0.5830230712890625, -0.5536575317382812, -0.5242919921875, -0.49492645263671875, -0.4655609130859375, -0.43619537353515625, -0.406829833984375, -0.37746429443359375, -0.3480987548828125, -0.31873321533203125, -0.28936767578125, -0.26000213623046875, -0.2306365966796875, -0.20127105712890625, -0.171905517578125, -0.14253997802734375, -0.1131744384765625, -0.08380889892578125, -0.054443359375, -0.02507781982421875, 0.0042877197265625, 0.03365325927734375, 0.063018798828125, 0.09238433837890625, 0.1217498779296875, 0.15111541748046875, 0.18048095703125, 0.20984649658203125, 0.2392120361328125, 0.26857757568359375, 0.297943115234375, 0.32730865478515625, 0.3566741943359375, 0.38603973388671875, 0.4154052734375, 0.44477081298828125, 0.4741363525390625, 0.5035018920898438, 0.532867431640625, 0.5622329711914062, 0.5915985107421875, 0.6209640502929688, 0.65032958984375, 0.6796951293945312, 0.7090606689453125, 0.7384262084960938, 0.767791748046875, 0.7971572875976562, 0.8265228271484375, 0.8558883666992188, 0.88525390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 9.0, 10.0, 28.0, 42.0, 111.0, 512.0, 9398.0, 1029636.0, 8062.0, 554.0, 109.0, 30.0, 18.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.15234375, -1.1238784790039062, -1.0954132080078125, -1.0669479370117188, -1.038482666015625, -1.0100173950195312, -0.9815521240234375, -0.9530868530273438, -0.92462158203125, -0.8961563110351562, -0.8676910400390625, -0.8392257690429688, -0.810760498046875, -0.7822952270507812, -0.7538299560546875, -0.7253646850585938, -0.6968994140625, -0.6684341430664062, -0.6399688720703125, -0.6115036010742188, -0.583038330078125, -0.5545730590820312, -0.5261077880859375, -0.49764251708984375, -0.46917724609375, -0.44071197509765625, -0.4122467041015625, -0.38378143310546875, -0.355316162109375, -0.32685089111328125, -0.2983856201171875, -0.26992034912109375, -0.241455078125, -0.21298980712890625, -0.1845245361328125, -0.15605926513671875, -0.127593994140625, -0.09912872314453125, -0.0706634521484375, -0.04219818115234375, -0.01373291015625, 0.01473236083984375, 0.0431976318359375, 0.07166290283203125, 0.100128173828125, 0.12859344482421875, 0.1570587158203125, 0.18552398681640625, 0.2139892578125, 0.24245452880859375, 0.2709197998046875, 0.29938507080078125, 0.327850341796875, 0.35631561279296875, 0.3847808837890625, 0.41324615478515625, 0.44171142578125, 0.47017669677734375, 0.4986419677734375, 0.5271072387695312, 0.555572509765625, 0.5840377807617188, 0.6125030517578125, 0.6409683227539062, 0.66943359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 8.0, 5.0, 7.0, 8.0, 12.0, 9.0, 10.0, 20.0, 29.0, 31.0, 44.0, 63.0, 75.0, 112.0, 103.0, 109.0, 91.0, 64.0, 41.0, 30.0, 21.0, 15.0, 14.0, 8.0, 11.0, 12.0, 14.0, 3.0, 7.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.341934204101562e-05, -6.103515625e-05, -5.8650970458984375e-05, -5.626678466796875e-05, -5.3882598876953125e-05, -5.14984130859375e-05, -4.9114227294921875e-05, -4.673004150390625e-05, -4.4345855712890625e-05, -4.1961669921875e-05, -3.9577484130859375e-05, -3.719329833984375e-05, -3.4809112548828125e-05, -3.24249267578125e-05, -3.0040740966796875e-05, -2.765655517578125e-05, -2.5272369384765625e-05, -2.288818359375e-05, -2.0503997802734375e-05, -1.811981201171875e-05, -1.5735626220703125e-05, -1.33514404296875e-05, -1.0967254638671875e-05, -8.58306884765625e-06, -6.198883056640625e-06, -3.814697265625e-06, -1.430511474609375e-06, 9.5367431640625e-07, 3.337860107421875e-06, 5.7220458984375e-06, 8.106231689453125e-06, 1.049041748046875e-05, 1.2874603271484375e-05, 1.52587890625e-05, 1.7642974853515625e-05, 2.002716064453125e-05, 2.2411346435546875e-05, 2.47955322265625e-05, 2.7179718017578125e-05, 2.956390380859375e-05, 3.1948089599609375e-05, 3.4332275390625e-05, 3.6716461181640625e-05, 3.910064697265625e-05, 4.1484832763671875e-05, 4.38690185546875e-05, 4.6253204345703125e-05, 4.863739013671875e-05, 5.1021575927734375e-05, 5.340576171875e-05, 5.5789947509765625e-05, 5.817413330078125e-05, 6.0558319091796875e-05, 6.29425048828125e-05, 6.532669067382812e-05, 6.771087646484375e-05, 7.009506225585938e-05, 7.2479248046875e-05, 7.486343383789062e-05, 7.724761962890625e-05, 7.963180541992188e-05, 8.20159912109375e-05, 8.440017700195312e-05, 8.678436279296875e-05, 8.916854858398438e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 7.0, 11.0, 8.0, 11.0, 17.0, 23.0, 38.0, 60.0, 89.0, 143.0, 285.0, 570.0, 1457.0, 4801.0, 31202.0, 691646.0, 296793.0, 16125.0, 3172.0, 1089.0, 427.0, 218.0, 122.0, 76.0, 53.0, 34.0, 25.0, 16.0, 13.0, 5.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.272216796875, -0.2644062042236328, -0.2565956115722656, -0.24878501892089844, -0.24097442626953125, -0.23316383361816406, -0.22535324096679688, -0.2175426483154297, -0.2097320556640625, -0.2019214630126953, -0.19411087036132812, -0.18630027770996094, -0.17848968505859375, -0.17067909240722656, -0.16286849975585938, -0.1550579071044922, -0.147247314453125, -0.1394367218017578, -0.13162612915039062, -0.12381553649902344, -0.11600494384765625, -0.10819435119628906, -0.10038375854492188, -0.09257316589355469, -0.0847625732421875, -0.07695198059082031, -0.06914138793945312, -0.06133079528808594, -0.05352020263671875, -0.04570960998535156, -0.037899017333984375, -0.030088424682617188, -0.02227783203125, -0.014467239379882812, -0.006656646728515625, 0.0011539459228515625, 0.00896453857421875, 0.016775131225585938, 0.024585723876953125, 0.03239631652832031, 0.0402069091796875, 0.04801750183105469, 0.055828094482421875, 0.06363868713378906, 0.07144927978515625, 0.07925987243652344, 0.08707046508789062, 0.09488105773925781, 0.102691650390625, 0.11050224304199219, 0.11831283569335938, 0.12612342834472656, 0.13393402099609375, 0.14174461364746094, 0.14955520629882812, 0.1573657989501953, 0.1651763916015625, 0.1729869842529297, 0.18079757690429688, 0.18860816955566406, 0.19641876220703125, 0.20422935485839844, 0.21203994750976562, 0.2198505401611328, 0.2276611328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 11.0, 37.0, 44.0, 82.0, 107.0, 158.0, 165.0, 127.0, 98.0, 66.0, 25.0, 19.0, 14.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4384765625, -0.4256553649902344, -0.41283416748046875, -0.4000129699707031, -0.3871917724609375, -0.3743705749511719, -0.36154937744140625, -0.3487281799316406, -0.335906982421875, -0.3230857849121094, -0.31026458740234375, -0.2974433898925781, -0.2846221923828125, -0.2718009948730469, -0.25897979736328125, -0.24615859985351562, -0.23333740234375, -0.22051620483398438, -0.20769500732421875, -0.19487380981445312, -0.1820526123046875, -0.16923141479492188, -0.15641021728515625, -0.14358901977539062, -0.130767822265625, -0.11794662475585938, -0.10512542724609375, -0.09230422973632812, -0.0794830322265625, -0.06666183471679688, -0.05384063720703125, -0.041019439697265625, -0.0281982421875, -0.015377044677734375, -0.00255584716796875, 0.010265350341796875, 0.0230865478515625, 0.035907745361328125, 0.04872894287109375, 0.061550140380859375, 0.074371337890625, 0.08719253540039062, 0.10001373291015625, 0.11283493041992188, 0.1256561279296875, 0.13847732543945312, 0.15129852294921875, 0.16411972045898438, 0.17694091796875, 0.18976211547851562, 0.20258331298828125, 0.21540451049804688, 0.2282257080078125, 0.24104690551757812, 0.25386810302734375, 0.2666893005371094, 0.279510498046875, 0.2923316955566406, 0.30515289306640625, 0.3179740905761719, 0.3307952880859375, 0.3436164855957031, 0.35643768310546875, 0.3692588806152344, 0.382080078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 22.0, 50.0, 150.0, 305.0, 285.0, 135.0, 32.0, 9.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.243878364562988, -7.036629676818848, -6.829380989074707, -6.622132301330566, -6.414883613586426, -6.207634925842285, -6.0003862380981445, -5.793137550354004, -5.585888862609863, -5.378640174865723, -5.171391487121582, -4.964142799377441, -4.756894111633301, -4.54964542388916, -4.3423967361450195, -4.135148048400879, -3.9278995990753174, -3.7206509113311768, -3.513402223587036, -3.3061535358428955, -3.098904848098755, -2.8916563987731934, -2.6844077110290527, -2.477159023284912, -2.2699103355407715, -2.062661647796631, -1.8554129600524902, -1.6481642723083496, -1.440915584564209, -1.233667016029358, -1.0264183282852173, -0.8191696405410767, -0.6119208335876465, -0.40467214584350586, -0.19742348790168762, 0.009825170040130615, 0.21707385778427124, 0.4243224859237671, 0.6315711736679077, 0.8388198614120483, 1.046068549156189, 1.2533172369003296, 1.4605659246444702, 1.6678144931793213, 1.875063180923462, 2.0823118686676025, 2.289560556411743, 2.496809244155884, 2.7040579319000244, 2.911306619644165, 3.1185553073883057, 3.3258039951324463, 3.533052682876587, 3.7403011322021484, 3.947549819946289, 4.15479850769043, 4.36204719543457, 4.569295883178711, 4.776544570922852, 4.983793258666992, 5.191041946411133, 5.398290634155273, 5.605539321899414, 5.812788009643555, 6.020036697387695]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 12.0, 9.0, 11.0, 18.0, 24.0, 17.0, 29.0, 23.0, 27.0, 22.0, 37.0, 50.0, 43.0, 42.0, 53.0, 53.0, 42.0, 44.0, 49.0, 47.0, 45.0, 29.0, 27.0, 25.0, 31.0, 24.0, 22.0, 15.0, 17.0, 14.0, 18.0, 6.0, 7.0, 7.0, 4.0, 3.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.311081886291504, -4.176558971405029, -4.042036056518555, -3.90751314163208, -3.7729902267456055, -3.638467311859131, -3.503944158554077, -3.3694212436676025, -3.234898328781128, -3.1003754138946533, -2.9658524990081787, -2.831329584121704, -2.6968064308166504, -2.562283515930176, -2.427760601043701, -2.2932376861572266, -2.158714771270752, -2.0241918563842773, -1.8896689414978027, -1.7551459074020386, -1.620622992515564, -1.4861000776290894, -1.3515770435333252, -1.2170541286468506, -1.082531213760376, -0.9480082988739014, -0.813485324382782, -0.6789623498916626, -0.544439435005188, -0.4099165201187134, -0.275393545627594, -0.1408705711364746, -0.006347179412841797, 0.1281757652759552, 0.2626987099647522, 0.3972216546535492, 0.5317445993423462, 0.6662675142288208, 0.8007904887199402, 0.9353134632110596, 1.0698363780975342, 1.2043592929840088, 1.3388822078704834, 1.4734052419662476, 1.6079281568527222, 1.7424510717391968, 1.876974105834961, 2.0114970207214355, 2.14601993560791, 2.2805428504943848, 2.4150657653808594, 2.549588680267334, 2.6841115951538086, 2.818634510040283, 2.953157663345337, 3.0876805782318115, 3.222203493118286, 3.3567264080047607, 3.4912493228912354, 3.62577223777771, 3.7602953910827637, 3.8948183059692383, 4.029341220855713, 4.1638641357421875, 4.298387050628662]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 6.0, 19.0, 21.0, 35.0, 32.0, 70.0, 106.0, 210.0, 407.0, 946.0, 3677.0, 33943.0, 4091754.0, 55981.0, 4798.0, 1211.0, 448.0, 227.0, 133.0, 79.0, 45.0, 37.0, 21.0, 18.0, 7.0, 5.0, 7.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4614448547363281, -0.44266510009765625, -0.4238853454589844, -0.4051055908203125, -0.3863258361816406, -0.36754608154296875, -0.3487663269042969, -0.329986572265625, -0.3112068176269531, -0.29242706298828125, -0.2736473083496094, -0.2548675537109375, -0.23608779907226562, -0.21730804443359375, -0.19852828979492188, -0.17974853515625, -0.16096878051757812, -0.14218902587890625, -0.12340927124023438, -0.1046295166015625, -0.08584976196289062, -0.06707000732421875, -0.048290252685546875, -0.029510498046875, -0.010730743408203125, 0.00804901123046875, 0.026828765869140625, 0.0456085205078125, 0.06438827514648438, 0.08316802978515625, 0.10194778442382812, 0.1207275390625, 0.13950729370117188, 0.15828704833984375, 0.17706680297851562, 0.1958465576171875, 0.21462631225585938, 0.23340606689453125, 0.2521858215332031, 0.270965576171875, 0.2897453308105469, 0.30852508544921875, 0.3273048400878906, 0.3460845947265625, 0.3648643493652344, 0.38364410400390625, 0.4024238586425781, 0.42120361328125, 0.4399833679199219, 0.45876312255859375, 0.4775428771972656, 0.4963226318359375, 0.5151023864746094, 0.5338821411132812, 0.5526618957519531, 0.571441650390625, 0.5902214050292969, 0.6090011596679688, 0.6277809143066406, 0.6465606689453125, 0.6653404235839844, 0.6841201782226562, 0.7028999328613281, 0.7216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 17.0, 22.0, 16.0, 36.0, 39.0, 52.0, 62.0, 57.0, 74.0, 72.0, 84.0, 84.0, 72.0, 66.0, 52.0, 30.0, 29.0, 21.0, 17.0, 10.0, 15.0, 9.0, 10.0, 4.0, 1.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2939453125, -0.28488922119140625, -0.2758331298828125, -0.26677703857421875, -0.257720947265625, -0.24866485595703125, -0.2396087646484375, -0.23055267333984375, -0.22149658203125, -0.21244049072265625, -0.2033843994140625, -0.19432830810546875, -0.185272216796875, -0.17621612548828125, -0.1671600341796875, -0.15810394287109375, -0.1490478515625, -0.13999176025390625, -0.1309356689453125, -0.12187957763671875, -0.112823486328125, -0.10376739501953125, -0.0947113037109375, -0.08565521240234375, -0.07659912109375, -0.06754302978515625, -0.0584869384765625, -0.04943084716796875, -0.040374755859375, -0.03131866455078125, -0.0222625732421875, -0.01320648193359375, -0.004150390625, 0.00490570068359375, 0.0139617919921875, 0.02301788330078125, 0.032073974609375, 0.04113006591796875, 0.0501861572265625, 0.05924224853515625, 0.06829833984375, 0.07735443115234375, 0.0864105224609375, 0.09546661376953125, 0.104522705078125, 0.11357879638671875, 0.1226348876953125, 0.13169097900390625, 0.1407470703125, 0.14980316162109375, 0.1588592529296875, 0.16791534423828125, 0.176971435546875, 0.18602752685546875, 0.1950836181640625, 0.20413970947265625, 0.21319580078125, 0.22225189208984375, 0.2313079833984375, 0.24036407470703125, 0.249420166015625, 0.25847625732421875, 0.2675323486328125, 0.27658843994140625, 0.28564453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 17.0, 23.0, 24.0, 37.0, 47.0, 65.0, 92.0, 83.0, 118.0, 125.0, 150.0, 159.0, 206.0, 388.0, 9716.0, 4181005.0, 724.0, 270.0, 182.0, 158.0, 144.0, 92.0, 81.0, 81.0, 66.0, 45.0, 29.0, 22.0, 22.0, 22.0, 17.0, 9.0, 5.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.708984375, -3.597320556640625, -3.48565673828125, -3.373992919921875, -3.2623291015625, -3.150665283203125, -3.03900146484375, -2.927337646484375, -2.815673828125, -2.704010009765625, -2.59234619140625, -2.480682373046875, -2.3690185546875, -2.257354736328125, -2.14569091796875, -2.034027099609375, -1.92236328125, -1.810699462890625, -1.69903564453125, -1.587371826171875, -1.4757080078125, -1.364044189453125, -1.25238037109375, -1.140716552734375, -1.029052734375, -0.917388916015625, -0.80572509765625, -0.694061279296875, -0.5823974609375, -0.470733642578125, -0.35906982421875, -0.247406005859375, -0.1357421875, -0.024078369140625, 0.08758544921875, 0.199249267578125, 0.3109130859375, 0.422576904296875, 0.53424072265625, 0.645904541015625, 0.757568359375, 0.869232177734375, 0.98089599609375, 1.092559814453125, 1.2042236328125, 1.315887451171875, 1.42755126953125, 1.539215087890625, 1.65087890625, 1.762542724609375, 1.87420654296875, 1.985870361328125, 2.0975341796875, 2.209197998046875, 2.32086181640625, 2.432525634765625, 2.544189453125, 2.655853271484375, 2.76751708984375, 2.879180908203125, 2.9908447265625, 3.102508544921875, 3.21417236328125, 3.325836181640625, 3.4375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 249.0, 3829.0, 7.0, 1.0, 0.0, 1.0], "bins": [-4.125, -4.055194854736328, -3.9853897094726562, -3.9155845642089844, -3.8457794189453125, -3.7759742736816406, -3.7061691284179688, -3.636363983154297, -3.566558837890625, -3.496753692626953, -3.4269485473632812, -3.3571434020996094, -3.2873382568359375, -3.2175331115722656, -3.1477279663085938, -3.077922821044922, -3.00811767578125, -2.938312530517578, -2.8685073852539062, -2.7987022399902344, -2.7288970947265625, -2.6590919494628906, -2.5892868041992188, -2.519481658935547, -2.449676513671875, -2.379871368408203, -2.3100662231445312, -2.2402610778808594, -2.1704559326171875, -2.1006507873535156, -2.0308456420898438, -1.9610404968261719, -1.8912353515625, -1.8214302062988281, -1.7516250610351562, -1.6818199157714844, -1.6120147705078125, -1.5422096252441406, -1.4724044799804688, -1.4025993347167969, -1.332794189453125, -1.2629890441894531, -1.1931838989257812, -1.1233787536621094, -1.0535736083984375, -0.9837684631347656, -0.9139633178710938, -0.8441581726074219, -0.77435302734375, -0.7045478820800781, -0.6347427368164062, -0.5649375915527344, -0.4951324462890625, -0.4253273010253906, -0.35552215576171875, -0.2857170104980469, -0.215911865234375, -0.14610671997070312, -0.07630157470703125, -0.006496429443359375, 0.0633087158203125, 0.13311386108398438, 0.20291900634765625, 0.2727241516113281, 0.342529296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 30.0, 225.0, 634.0, 92.0, 15.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-15.436528205871582, -15.161609649658203, -14.886691093444824, -14.611773490905762, -14.336854934692383, -14.061936378479004, -13.787017822265625, -13.512100219726562, -13.237181663513184, -12.962263107299805, -12.687344551086426, -12.412426948547363, -12.137508392333984, -11.862589836120605, -11.587671279907227, -11.312753677368164, -11.037834167480469, -10.76291561126709, -10.487997055053711, -10.213079452514648, -9.93816089630127, -9.66324234008789, -9.388323783874512, -9.113405227661133, -8.83848762512207, -8.563569068908691, -8.288650512695312, -8.01373291015625, -7.738814353942871, -7.463895797729492, -7.188977241516113, -6.914059162139893, -6.63914155960083, -6.364223003387451, -6.0893049240112305, -5.814386367797852, -5.539468288421631, -5.264549732208252, -4.989631652832031, -4.714713096618652, -4.439794540405273, -4.1648759841918945, -3.889957904815674, -3.615039348602295, -3.340121269226074, -3.0652027130126953, -2.7902843952178955, -2.5153660774230957, -2.240447998046875, -1.9655296802520752, -1.6906113624572754, -1.415692925453186, -1.1407746076583862, -0.8658562898635864, -0.5909378528594971, -0.31601953506469727, -0.04110121726989746, 0.23381713032722473, 0.5087354779243469, 0.7836538553237915, 1.0585721731185913, 1.3334904909133911, 1.6084089279174805, 1.8833272457122803, 2.15824556350708]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 23.0, 25.0, 33.0, 66.0, 78.0, 99.0, 165.0, 153.0, 121.0, 88.0, 45.0, 25.0, 24.0, 17.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.094334602355957, -5.877405166625977, -5.660475730895996, -5.443546295166016, -5.226616859436035, -5.009687423706055, -4.792757987976074, -4.575828552246094, -4.358899116516113, -4.141969680786133, -3.9250402450561523, -3.708110809326172, -3.4911813735961914, -3.274251937866211, -3.0573225021362305, -2.84039306640625, -2.6234633922576904, -2.40653395652771, -2.1896045207977295, -1.972675085067749, -1.7557456493377686, -1.5388160943984985, -1.321886658668518, -1.1049572229385376, -0.8880277872085571, -0.6710983514785767, -0.4541688859462738, -0.23723942041397095, -0.02030998468399048, 0.19661951065063477, 0.41354894638061523, 0.6304783821105957, 0.8474078178405762, 1.0643372535705566, 1.281266689300537, 1.4981961250305176, 1.715125560760498, 1.932055115699768, 2.148984432220459, 2.3659138679504395, 2.58284330368042, 2.7997727394104004, 3.016702175140381, 3.2336316108703613, 3.450561046600342, 3.6674904823303223, 3.8844199180603027, 4.101349353790283, 4.318279266357422, 4.535208702087402, 4.752138137817383, 4.969067573547363, 5.185997009277344, 5.402926445007324, 5.619855880737305, 5.836785316467285, 6.053714752197266, 6.270644187927246, 6.487573623657227, 6.704503059387207, 6.9214324951171875, 7.138361930847168, 7.355291366577148, 7.572220802307129, 7.789150238037109]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 12.0, 15.0, 25.0, 28.0, 53.0, 80.0, 141.0, 256.0, 433.0, 840.0, 2154.0, 6479.0, 27877.0, 233341.0, 677445.0, 78909.0, 13862.0, 3763.0, 1387.0, 622.0, 317.0, 192.0, 116.0, 62.0, 50.0, 22.0, 19.0, 14.0, 8.0, 5.0, 4.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.69287109375, -0.6714019775390625, -0.649932861328125, -0.6284637451171875, -0.60699462890625, -0.5855255126953125, -0.564056396484375, -0.5425872802734375, -0.5211181640625, -0.4996490478515625, -0.478179931640625, -0.4567108154296875, -0.43524169921875, -0.4137725830078125, -0.392303466796875, -0.3708343505859375, -0.349365234375, -0.3278961181640625, -0.306427001953125, -0.2849578857421875, -0.26348876953125, -0.2420196533203125, -0.220550537109375, -0.1990814208984375, -0.1776123046875, -0.1561431884765625, -0.134674072265625, -0.1132049560546875, -0.09173583984375, -0.0702667236328125, -0.048797607421875, -0.0273284912109375, -0.005859375, 0.0156097412109375, 0.037078857421875, 0.0585479736328125, 0.08001708984375, 0.1014862060546875, 0.122955322265625, 0.1444244384765625, 0.1658935546875, 0.1873626708984375, 0.208831787109375, 0.2303009033203125, 0.25177001953125, 0.2732391357421875, 0.294708251953125, 0.3161773681640625, 0.337646484375, 0.3591156005859375, 0.380584716796875, 0.4020538330078125, 0.42352294921875, 0.4449920654296875, 0.466461181640625, 0.4879302978515625, 0.5093994140625, 0.5308685302734375, 0.552337646484375, 0.5738067626953125, 0.59527587890625, 0.6167449951171875, 0.638214111328125, 0.6596832275390625, 0.68115234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 8.0, 11.0, 8.0, 28.0, 29.0, 32.0, 36.0, 55.0, 63.0, 78.0, 84.0, 92.0, 97.0, 80.0, 71.0, 63.0, 44.0, 31.0, 26.0, 14.0, 12.0, 11.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5005340576171875, -0.483001708984375, -0.4654693603515625, -0.44793701171875, -0.4304046630859375, -0.412872314453125, -0.3953399658203125, -0.3778076171875, -0.3602752685546875, -0.342742919921875, -0.3252105712890625, -0.30767822265625, -0.2901458740234375, -0.272613525390625, -0.2550811767578125, -0.237548828125, -0.2200164794921875, -0.202484130859375, -0.1849517822265625, -0.16741943359375, -0.1498870849609375, -0.132354736328125, -0.1148223876953125, -0.0972900390625, -0.0797576904296875, -0.062225341796875, -0.0446929931640625, -0.02716064453125, -0.0096282958984375, 0.007904052734375, 0.0254364013671875, 0.04296875, 0.0605010986328125, 0.078033447265625, 0.0955657958984375, 0.11309814453125, 0.1306304931640625, 0.148162841796875, 0.1656951904296875, 0.1832275390625, 0.2007598876953125, 0.218292236328125, 0.2358245849609375, 0.25335693359375, 0.2708892822265625, 0.288421630859375, 0.3059539794921875, 0.323486328125, 0.3410186767578125, 0.358551025390625, 0.3760833740234375, 0.39361572265625, 0.4111480712890625, 0.428680419921875, 0.4462127685546875, 0.4637451171875, 0.4812774658203125, 0.498809814453125, 0.5163421630859375, 0.53387451171875, 0.5514068603515625, 0.568939208984375, 0.5864715576171875, 0.60400390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 12.0, 36.0, 79.0, 196.0, 610.0, 3402.0, 1027021.0, 15698.0, 971.0, 298.0, 112.0, 56.0, 19.0, 13.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.1197509765625, -3.007080078125, -2.8944091796875, -2.78173828125, -2.6690673828125, -2.556396484375, -2.4437255859375, -2.3310546875, -2.2183837890625, -2.105712890625, -1.9930419921875, -1.88037109375, -1.7677001953125, -1.655029296875, -1.5423583984375, -1.4296875, -1.3170166015625, -1.204345703125, -1.0916748046875, -0.97900390625, -0.8663330078125, -0.753662109375, -0.6409912109375, -0.5283203125, -0.4156494140625, -0.302978515625, -0.1903076171875, -0.07763671875, 0.0350341796875, 0.147705078125, 0.2603759765625, 0.373046875, 0.4857177734375, 0.598388671875, 0.7110595703125, 0.82373046875, 0.9364013671875, 1.049072265625, 1.1617431640625, 1.2744140625, 1.3870849609375, 1.499755859375, 1.6124267578125, 1.72509765625, 1.8377685546875, 1.950439453125, 2.0631103515625, 2.17578125, 2.2884521484375, 2.401123046875, 2.5137939453125, 2.62646484375, 2.7391357421875, 2.851806640625, 2.9644775390625, 3.0771484375, 3.1898193359375, 3.302490234375, 3.4151611328125, 3.52783203125, 3.6405029296875, 3.753173828125, 3.8658447265625, 3.978515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 10.0, 28.0, 92.0, 268.0, 270.0, 209.0, 95.0, 27.0, 10.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.91046142578125, -7.6802978515625, -7.45013427734375, -7.219970703125, -6.98980712890625, -6.7596435546875, -6.52947998046875, -6.29931640625, -6.06915283203125, -5.8389892578125, -5.60882568359375, -5.378662109375, -5.14849853515625, -4.9183349609375, -4.68817138671875, -4.4580078125, -4.22784423828125, -3.9976806640625, -3.76751708984375, -3.537353515625, -3.30718994140625, -3.0770263671875, -2.84686279296875, -2.61669921875, -2.38653564453125, -2.1563720703125, -1.92620849609375, -1.696044921875, -1.46588134765625, -1.2357177734375, -1.00555419921875, -0.775390625, -0.54522705078125, -0.3150634765625, -0.08489990234375, 0.145263671875, 0.37542724609375, 0.6055908203125, 0.83575439453125, 1.06591796875, 1.29608154296875, 1.5262451171875, 1.75640869140625, 1.986572265625, 2.21673583984375, 2.4468994140625, 2.67706298828125, 2.9072265625, 3.13739013671875, 3.3675537109375, 3.59771728515625, 3.827880859375, 4.05804443359375, 4.2882080078125, 4.51837158203125, 4.74853515625, 4.97869873046875, 5.2088623046875, 5.43902587890625, 5.669189453125, 5.89935302734375, 6.1295166015625, 6.35968017578125, 6.58984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 11.0, 31.0, 120.0, 1040.0, 1042332.0, 4711.0, 225.0, 45.0, 19.0, 10.0, 3.0, 6.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.202667236328125, -4.09674072265625, -3.990814208984375, -3.8848876953125, -3.778961181640625, -3.67303466796875, -3.567108154296875, -3.461181640625, -3.355255126953125, -3.24932861328125, -3.143402099609375, -3.0374755859375, -2.931549072265625, -2.82562255859375, -2.719696044921875, -2.61376953125, -2.507843017578125, -2.40191650390625, -2.295989990234375, -2.1900634765625, -2.084136962890625, -1.97821044921875, -1.872283935546875, -1.766357421875, -1.660430908203125, -1.55450439453125, -1.448577880859375, -1.3426513671875, -1.236724853515625, -1.13079833984375, -1.024871826171875, -0.9189453125, -0.813018798828125, -0.70709228515625, -0.601165771484375, -0.4952392578125, -0.389312744140625, -0.28338623046875, -0.177459716796875, -0.071533203125, 0.034393310546875, 0.14031982421875, 0.246246337890625, 0.3521728515625, 0.458099365234375, 0.56402587890625, 0.669952392578125, 0.77587890625, 0.881805419921875, 0.98773193359375, 1.093658447265625, 1.1995849609375, 1.305511474609375, 1.41143798828125, 1.517364501953125, 1.623291015625, 1.729217529296875, 1.83514404296875, 1.941070556640625, 2.0469970703125, 2.152923583984375, 2.25885009765625, 2.364776611328125, 2.470703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 5.0, 9.0, 7.0, 4.0, 10.0, 8.0, 17.0, 19.0, 32.0, 26.0, 57.0, 68.0, 122.0, 171.0, 132.0, 76.0, 56.0, 38.0, 37.0, 22.0, 14.0, 5.0, 6.0, 11.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010693073272705078, -0.00010365061461925507, -0.00010037049651145935, -9.709037840366364e-05, -9.381026029586792e-05, -9.05301421880722e-05, -8.725002408027649e-05, -8.396990597248077e-05, -8.068978786468506e-05, -7.740966975688934e-05, -7.412955164909363e-05, -7.084943354129791e-05, -6.75693154335022e-05, -6.428919732570648e-05, -6.1009079217910767e-05, -5.772896111011505e-05, -5.4448843002319336e-05, -5.116872489452362e-05, -4.7888606786727905e-05, -4.460848867893219e-05, -4.1328370571136475e-05, -3.804825246334076e-05, -3.4768134355545044e-05, -3.148801624774933e-05, -2.8207898139953613e-05, -2.4927780032157898e-05, -2.1647661924362183e-05, -1.8367543816566467e-05, -1.5087425708770752e-05, -1.1807307600975037e-05, -8.527189493179321e-06, -5.247071385383606e-06, -1.9669532775878906e-06, 1.3131648302078247e-06, 4.59328293800354e-06, 7.873401045799255e-06, 1.115351915359497e-05, 1.4433637261390686e-05, 1.77137553691864e-05, 2.0993873476982117e-05, 2.4273991584777832e-05, 2.7554109692573547e-05, 3.083422780036926e-05, 3.411434590816498e-05, 3.739446401596069e-05, 4.067458212375641e-05, 4.3954700231552124e-05, 4.723481833934784e-05, 5.0514936447143555e-05, 5.379505455493927e-05, 5.7075172662734985e-05, 6.03552907705307e-05, 6.363540887832642e-05, 6.691552698612213e-05, 7.019564509391785e-05, 7.347576320171356e-05, 7.675588130950928e-05, 8.003599941730499e-05, 8.331611752510071e-05, 8.659623563289642e-05, 8.987635374069214e-05, 9.315647184848785e-05, 9.643658995628357e-05, 9.971670806407928e-05, 0.000102996826171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 19.0, 95.0, 365.0, 8637.0, 1037654.0, 1500.0, 188.0, 57.0, 16.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.142578125, -2.05438232421875, -1.9661865234375, -1.87799072265625, -1.789794921875, -1.70159912109375, -1.6134033203125, -1.52520751953125, -1.43701171875, -1.34881591796875, -1.2606201171875, -1.17242431640625, -1.084228515625, -0.99603271484375, -0.9078369140625, -0.81964111328125, -0.7314453125, -0.64324951171875, -0.5550537109375, -0.46685791015625, -0.378662109375, -0.29046630859375, -0.2022705078125, -0.11407470703125, -0.02587890625, 0.06231689453125, 0.1505126953125, 0.23870849609375, 0.326904296875, 0.41510009765625, 0.5032958984375, 0.59149169921875, 0.6796875, 0.76788330078125, 0.8560791015625, 0.94427490234375, 1.032470703125, 1.12066650390625, 1.2088623046875, 1.29705810546875, 1.38525390625, 1.47344970703125, 1.5616455078125, 1.64984130859375, 1.738037109375, 1.82623291015625, 1.9144287109375, 2.00262451171875, 2.0908203125, 2.17901611328125, 2.2672119140625, 2.35540771484375, 2.443603515625, 2.53179931640625, 2.6199951171875, 2.70819091796875, 2.79638671875, 2.88458251953125, 2.9727783203125, 3.06097412109375, 3.149169921875, 3.23736572265625, 3.3255615234375, 3.41375732421875, 3.501953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 14.0, 55.0, 432.0, 407.0, 54.0, 20.0, 5.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.071685791015625, -1.00860595703125, -0.945526123046875, -0.8824462890625, -0.819366455078125, -0.75628662109375, -0.693206787109375, -0.630126953125, -0.567047119140625, -0.50396728515625, -0.440887451171875, -0.3778076171875, -0.314727783203125, -0.25164794921875, -0.188568115234375, -0.12548828125, -0.062408447265625, 0.00067138671875, 0.063751220703125, 0.1268310546875, 0.189910888671875, 0.25299072265625, 0.316070556640625, 0.379150390625, 0.442230224609375, 0.50531005859375, 0.568389892578125, 0.6314697265625, 0.694549560546875, 0.75762939453125, 0.820709228515625, 0.8837890625, 0.946868896484375, 1.00994873046875, 1.073028564453125, 1.1361083984375, 1.199188232421875, 1.26226806640625, 1.325347900390625, 1.388427734375, 1.451507568359375, 1.51458740234375, 1.577667236328125, 1.6407470703125, 1.703826904296875, 1.76690673828125, 1.829986572265625, 1.89306640625, 1.956146240234375, 2.01922607421875, 2.082305908203125, 2.1453857421875, 2.208465576171875, 2.27154541015625, 2.334625244140625, 2.397705078125, 2.460784912109375, 2.52386474609375, 2.586944580078125, 2.6500244140625, 2.713104248046875, 2.77618408203125, 2.839263916015625, 2.90234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 20.0, 52.0, 345.0, 510.0, 44.0, 12.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40204620361328, -37.2132682800293, -36.02449035644531, -34.83570861816406, -33.64693069458008, -32.458152770996094, -31.26937484741211, -30.080595016479492, -28.891815185546875, -27.70303726196289, -26.514257431030273, -25.32547950744629, -24.136699676513672, -22.947921752929688, -21.759143829345703, -20.570363998413086, -19.3815860748291, -18.192808151245117, -17.0040283203125, -15.815250396728516, -14.626470565795898, -13.437692642211914, -12.248913764953613, -11.060134887695312, -9.871356010437012, -8.682577133178711, -7.49379825592041, -6.305019855499268, -5.116240978240967, -3.927462100982666, -2.7386837005615234, -1.5499048233032227, -0.3611259460449219, 0.8276528120040894, 2.0164315700531006, 3.2052102088928223, 4.393989086151123, 5.582767963409424, 6.771546363830566, 7.960325241088867, 9.149104118347168, 10.337882995605469, 11.52666187286377, 12.71544075012207, 13.904218673706055, 15.092998504638672, 16.281776428222656, 17.47055435180664, 18.659334182739258, 19.848112106323242, 21.03689193725586, 22.225669860839844, 23.41444969177246, 24.603227615356445, 25.792007446289062, 26.980785369873047, 28.16956329345703, 29.358341217041016, 30.547121047973633, 31.735898971557617, 32.924678802490234, 34.11345672607422, 35.3022346496582, 36.49101257324219, 37.67979431152344]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 3.0, 6.0, 5.0, 10.0, 14.0, 18.0, 23.0, 27.0, 45.0, 29.0, 32.0, 46.0, 57.0, 63.0, 75.0, 60.0, 58.0, 63.0, 71.0, 45.0, 45.0, 50.0, 25.0, 23.0, 25.0, 14.0, 17.0, 9.0, 6.0, 9.0, 5.0, 11.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-16.041461944580078, -15.645145416259766, -15.248828887939453, -14.852511405944824, -14.456194877624512, -14.0598783493042, -13.66356086730957, -13.267244338989258, -12.870927810668945, -12.474611282348633, -12.07829475402832, -11.681977272033691, -11.285660743713379, -10.889344215393066, -10.493026733398438, -10.096710205078125, -9.700393676757812, -9.3040771484375, -8.907760620117188, -8.511443138122559, -8.115126609802246, -7.718810081481934, -7.322493076324463, -6.926176071166992, -6.52985954284668, -6.133543014526367, -5.7372260093688965, -5.340909004211426, -4.944592475891113, -4.548275947570801, -4.15195894241333, -3.7556421756744385, -3.359325408935547, -2.9630086421966553, -2.5666918754577637, -2.170375108718872, -1.7740583419799805, -1.3777415752410889, -0.9814248085021973, -0.5851080417633057, -0.18879127502441406, 0.20752549171447754, 0.6038422584533691, 1.0001590251922607, 1.3964757919311523, 1.792792558670044, 2.1891093254089355, 2.585426092147827, 2.9817428588867188, 3.3780596256256104, 3.774376392364502, 4.170693397521973, 4.567009925842285, 4.963326454162598, 5.359643459320068, 5.755960464477539, 6.152276992797852, 6.548593521118164, 6.944910526275635, 7.3412275314331055, 7.737544059753418, 8.13386058807373, 8.53017807006836, 8.926494598388672, 9.322811126708984]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 15.0, 15.0, 23.0, 32.0, 49.0, 84.0, 113.0, 157.0, 258.0, 356.0, 660.0, 1124.0, 1924.0, 3987.0, 8995.0, 26012.0, 142763.0, 3075730.0, 846898.0, 56645.0, 15315.0, 6033.0, 2909.0, 1611.0, 891.0, 573.0, 347.0, 219.0, 163.0, 98.0, 64.0, 54.0, 48.0, 28.0, 14.0, 18.0, 6.0, 8.0, 4.0, 7.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.357421875, -0.3468437194824219, -0.33626556396484375, -0.3256874084472656, -0.3151092529296875, -0.3045310974121094, -0.29395294189453125, -0.2833747863769531, -0.272796630859375, -0.2622184753417969, -0.25164031982421875, -0.24106216430664062, -0.2304840087890625, -0.21990585327148438, -0.20932769775390625, -0.19874954223632812, -0.18817138671875, -0.17759323120117188, -0.16701507568359375, -0.15643692016601562, -0.1458587646484375, -0.13528060913085938, -0.12470245361328125, -0.11412429809570312, -0.103546142578125, -0.09296798706054688, -0.08238983154296875, -0.07181167602539062, -0.0612335205078125, -0.050655364990234375, -0.04007720947265625, -0.029499053955078125, -0.0189208984375, -0.008342742919921875, 0.00223541259765625, 0.012813568115234375, 0.0233917236328125, 0.033969879150390625, 0.04454803466796875, 0.055126190185546875, 0.065704345703125, 0.07628250122070312, 0.08686065673828125, 0.09743881225585938, 0.1080169677734375, 0.11859512329101562, 0.12917327880859375, 0.13975143432617188, 0.15032958984375, 0.16090774536132812, 0.17148590087890625, 0.18206405639648438, 0.1926422119140625, 0.20322036743164062, 0.21379852294921875, 0.22437667846679688, 0.234954833984375, 0.24553298950195312, 0.25611114501953125, 0.2666893005371094, 0.2772674560546875, 0.2878456115722656, 0.29842376708984375, 0.3090019226074219, 0.319580078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 6.0, 3.0, 13.0, 19.0, 19.0, 27.0, 27.0, 49.0, 56.0, 68.0, 70.0, 88.0, 74.0, 88.0, 79.0, 68.0, 65.0, 36.0, 23.0, 36.0, 29.0, 14.0, 8.0, 5.0, 7.0, 5.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395751953125, -0.3832664489746094, -0.37078094482421875, -0.3582954406738281, -0.3458099365234375, -0.3333244323730469, -0.32083892822265625, -0.3083534240722656, -0.295867919921875, -0.2833824157714844, -0.27089691162109375, -0.2584114074707031, -0.2459259033203125, -0.23344039916992188, -0.22095489501953125, -0.20846939086914062, -0.19598388671875, -0.18349838256835938, -0.17101287841796875, -0.15852737426757812, -0.1460418701171875, -0.13355636596679688, -0.12107086181640625, -0.10858535766601562, -0.096099853515625, -0.08361434936523438, -0.07112884521484375, -0.058643341064453125, -0.0461578369140625, -0.033672332763671875, -0.02118682861328125, -0.008701324462890625, 0.0037841796875, 0.016269683837890625, 0.02875518798828125, 0.041240692138671875, 0.0537261962890625, 0.06621170043945312, 0.07869720458984375, 0.09118270874023438, 0.103668212890625, 0.11615371704101562, 0.12863922119140625, 0.14112472534179688, 0.1536102294921875, 0.16609573364257812, 0.17858123779296875, 0.19106674194335938, 0.20355224609375, 0.21603775024414062, 0.22852325439453125, 0.24100875854492188, 0.2534942626953125, 0.2659797668457031, 0.27846527099609375, 0.2909507751464844, 0.303436279296875, 0.3159217834472656, 0.32840728759765625, 0.3408927917480469, 0.3533782958984375, 0.3658638000488281, 0.37834930419921875, 0.3908348083496094, 0.4033203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 3.0, 3.0, 11.0, 15.0, 36.0, 50.0, 61.0, 114.0, 199.0, 493.0, 1254.0, 4833.0, 23698.0, 950106.0, 3172635.0, 31834.0, 6083.0, 1570.0, 594.0, 281.0, 136.0, 91.0, 60.0, 42.0, 25.0, 16.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79150390625, -0.7651748657226562, -0.7388458251953125, -0.7125167846679688, -0.686187744140625, -0.6598587036132812, -0.6335296630859375, -0.6072006225585938, -0.58087158203125, -0.5545425415039062, -0.5282135009765625, -0.5018844604492188, -0.475555419921875, -0.44922637939453125, -0.4228973388671875, -0.39656829833984375, -0.3702392578125, -0.34391021728515625, -0.3175811767578125, -0.29125213623046875, -0.264923095703125, -0.23859405517578125, -0.2122650146484375, -0.18593597412109375, -0.15960693359375, -0.13327789306640625, -0.1069488525390625, -0.08061981201171875, -0.054290771484375, -0.02796173095703125, -0.0016326904296875, 0.02469635009765625, 0.051025390625, 0.07735443115234375, 0.1036834716796875, 0.13001251220703125, 0.156341552734375, 0.18267059326171875, 0.2089996337890625, 0.23532867431640625, 0.26165771484375, 0.28798675537109375, 0.3143157958984375, 0.34064483642578125, 0.366973876953125, 0.39330291748046875, 0.4196319580078125, 0.44596099853515625, 0.4722900390625, 0.49861907958984375, 0.5249481201171875, 0.5512771606445312, 0.577606201171875, 0.6039352416992188, 0.6302642822265625, 0.6565933227539062, 0.68292236328125, 0.7092514038085938, 0.7355804443359375, 0.7619094848632812, 0.788238525390625, 0.8145675659179688, 0.8408966064453125, 0.8672256469726562, 0.8935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 3.0, 11.0, 6.0, 18.0, 37.0, 80.0, 347.0, 2406.0, 825.0, 159.0, 58.0, 31.0, 29.0, 10.0, 20.0, 7.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.8074188232421875, -0.770111083984375, -0.7328033447265625, -0.69549560546875, -0.6581878662109375, -0.620880126953125, -0.5835723876953125, -0.5462646484375, -0.5089569091796875, -0.471649169921875, -0.4343414306640625, -0.39703369140625, -0.3597259521484375, -0.322418212890625, -0.2851104736328125, -0.247802734375, -0.2104949951171875, -0.173187255859375, -0.1358795166015625, -0.09857177734375, -0.0612640380859375, -0.023956298828125, 0.0133514404296875, 0.0506591796875, 0.0879669189453125, 0.125274658203125, 0.1625823974609375, 0.19989013671875, 0.2371978759765625, 0.274505615234375, 0.3118133544921875, 0.34912109375, 0.3864288330078125, 0.423736572265625, 0.4610443115234375, 0.49835205078125, 0.5356597900390625, 0.572967529296875, 0.6102752685546875, 0.6475830078125, 0.6848907470703125, 0.722198486328125, 0.7595062255859375, 0.79681396484375, 0.8341217041015625, 0.871429443359375, 0.9087371826171875, 0.946044921875, 0.9833526611328125, 1.020660400390625, 1.0579681396484375, 1.09527587890625, 1.1325836181640625, 1.169891357421875, 1.2071990966796875, 1.2445068359375, 1.2818145751953125, 1.319122314453125, 1.3564300537109375, 1.39373779296875, 1.4310455322265625, 1.468353271484375, 1.5056610107421875, 1.54296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 10.0, 34.0, 180.0, 446.0, 201.0, 46.0, 28.0, 12.0, 6.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4840898513793945, -7.1733880043029785, -6.8626861572265625, -6.5519843101501465, -6.2412824630737305, -5.930580139160156, -5.61987829208374, -5.309176445007324, -4.998474597930908, -4.687772750854492, -4.377070903778076, -4.06636905670166, -3.755666971206665, -3.444965124130249, -3.134263038635254, -2.823561191558838, -2.512859344482422, -2.202157497406006, -1.8914555311203003, -1.5807535648345947, -1.2700517177581787, -0.9593498706817627, -0.6486479043960571, -0.33794593811035156, -0.027244091033935547, 0.28345781564712524, 0.594159722328186, 0.9048616290092468, 1.2155635356903076, 1.5262653827667236, 1.8369673490524292, 2.1476693153381348, 2.458372116088867, 2.769073963165283, 3.079775810241699, 3.3904778957366943, 3.7011797428131104, 4.0118818283081055, 4.3225836753845215, 4.6332855224609375, 4.9439873695373535, 5.2546892166137695, 5.5653910636901855, 5.876092910766602, 6.186795234680176, 6.497496604919434, 6.808198928833008, 7.118900775909424, 7.42960262298584, 7.740304470062256, 8.051006317138672, 8.361708641052246, 8.672410011291504, 8.983112335205078, 9.293813705444336, 9.60451602935791, 9.915218353271484, 10.225920677185059, 10.536622047424316, 10.84732437133789, 11.158025741577148, 11.468728065490723, 11.77942943572998, 12.090131759643555, 12.400833129882812]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 15.0, 15.0, 16.0, 27.0, 30.0, 40.0, 58.0, 44.0, 46.0, 77.0, 66.0, 64.0, 60.0, 56.0, 64.0, 41.0, 59.0, 50.0, 30.0, 15.0, 20.0, 21.0, 17.0, 20.0, 8.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.888029098510742, -4.734557151794434, -4.581085205078125, -4.427613258361816, -4.274141311645508, -4.120669364929199, -3.9671971797943115, -3.813724994659424, -3.6602530479431152, -3.5067811012268066, -3.353309154510498, -3.1998372077941895, -3.0463650226593018, -2.892893075942993, -2.7394211292266846, -2.585948944091797, -2.4324772357940674, -2.279005289077759, -2.12553334236145, -1.972061276435852, -1.818589210510254, -1.6651172637939453, -1.5116453170776367, -1.3581732511520386, -1.20470130443573, -1.0512293577194214, -0.8977572917938232, -0.7442853450775146, -0.5908133387565613, -0.4373413324356079, -0.2838693857192993, -0.13039731979370117, 0.023074626922607422, 0.1765466183423996, 0.3300186097621918, 0.48349058628082275, 0.6369625926017761, 0.7904345989227295, 0.9439065456390381, 1.0973786115646362, 1.2508505582809448, 1.4043225049972534, 1.5577945709228516, 1.7112665176391602, 1.8647384643554688, 2.0182104110717773, 2.171682357788086, 2.3251545429229736, 2.4786264896392822, 2.632098436355591, 2.7855703830718994, 2.939042568206787, 3.0925145149230957, 3.2459864616394043, 3.399458408355713, 3.5529303550720215, 3.70640230178833, 3.8598742485046387, 4.013346195220947, 4.166818141937256, 4.3202900886535645, 4.473762512207031, 4.62723445892334, 4.780706405639648, 4.934178352355957]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 8.0, 10.0, 14.0, 16.0, 25.0, 37.0, 34.0, 73.0, 87.0, 125.0, 202.0, 318.0, 474.0, 761.0, 1152.0, 1863.0, 3066.0, 5579.0, 10167.0, 20131.0, 43628.0, 105611.0, 262116.0, 329765.0, 147640.0, 59636.0, 26444.0, 12748.0, 6881.0, 3821.0, 2283.0, 1349.0, 839.0, 585.0, 328.0, 232.0, 153.0, 102.0, 70.0, 57.0, 38.0, 14.0, 17.0, 18.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-0.2333984375, -0.22657012939453125, -0.2197418212890625, -0.21291351318359375, -0.206085205078125, -0.19925689697265625, -0.1924285888671875, -0.18560028076171875, -0.17877197265625, -0.17194366455078125, -0.1651153564453125, -0.15828704833984375, -0.151458740234375, -0.14463043212890625, -0.1378021240234375, -0.13097381591796875, -0.1241455078125, -0.11731719970703125, -0.1104888916015625, -0.10366058349609375, -0.096832275390625, -0.09000396728515625, -0.0831756591796875, -0.07634735107421875, -0.06951904296875, -0.06269073486328125, -0.0558624267578125, -0.04903411865234375, -0.042205810546875, -0.03537750244140625, -0.0285491943359375, -0.02172088623046875, -0.014892578125, -0.00806427001953125, -0.0012359619140625, 0.00559234619140625, 0.012420654296875, 0.01924896240234375, 0.0260772705078125, 0.03290557861328125, 0.03973388671875, 0.04656219482421875, 0.0533905029296875, 0.06021881103515625, 0.067047119140625, 0.07387542724609375, 0.0807037353515625, 0.08753204345703125, 0.0943603515625, 0.10118865966796875, 0.1080169677734375, 0.11484527587890625, 0.121673583984375, 0.12850189208984375, 0.1353302001953125, 0.14215850830078125, 0.14898681640625, 0.15581512451171875, 0.1626434326171875, 0.16947174072265625, 0.176300048828125, 0.18312835693359375, 0.1899566650390625, 0.19678497314453125, 0.20361328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 6.0, 10.0, 12.0, 14.0, 18.0, 17.0, 20.0, 30.0, 34.0, 32.0, 44.0, 58.0, 61.0, 64.0, 58.0, 55.0, 66.0, 60.0, 41.0, 56.0, 41.0, 36.0, 35.0, 26.0, 14.0, 14.0, 13.0, 8.0, 9.0, 8.0, 4.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.278839111328125, -0.26959228515625, -0.260345458984375, -0.2510986328125, -0.241851806640625, -0.23260498046875, -0.223358154296875, -0.214111328125, -0.204864501953125, -0.19561767578125, -0.186370849609375, -0.1771240234375, -0.167877197265625, -0.15863037109375, -0.149383544921875, -0.14013671875, -0.130889892578125, -0.12164306640625, -0.112396240234375, -0.1031494140625, -0.093902587890625, -0.08465576171875, -0.075408935546875, -0.066162109375, -0.056915283203125, -0.04766845703125, -0.038421630859375, -0.0291748046875, -0.019927978515625, -0.01068115234375, -0.001434326171875, 0.0078125, 0.017059326171875, 0.02630615234375, 0.035552978515625, 0.0447998046875, 0.054046630859375, 0.06329345703125, 0.072540283203125, 0.081787109375, 0.091033935546875, 0.10028076171875, 0.109527587890625, 0.1187744140625, 0.128021240234375, 0.13726806640625, 0.146514892578125, 0.15576171875, 0.165008544921875, 0.17425537109375, 0.183502197265625, 0.1927490234375, 0.201995849609375, 0.21124267578125, 0.220489501953125, 0.229736328125, 0.238983154296875, 0.24822998046875, 0.257476806640625, 0.2667236328125, 0.275970458984375, 0.28521728515625, 0.294464111328125, 0.3037109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 9.0, 16.0, 25.0, 30.0, 42.0, 65.0, 110.0, 143.0, 267.0, 452.0, 826.0, 2134.0, 10171.0, 252106.0, 757745.0, 19040.0, 3056.0, 987.0, 515.0, 277.0, 160.0, 105.0, 90.0, 58.0, 45.0, 14.0, 16.0, 13.0, 6.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9794921875, -0.946990966796875, -0.91448974609375, -0.881988525390625, -0.8494873046875, -0.816986083984375, -0.78448486328125, -0.751983642578125, -0.719482421875, -0.686981201171875, -0.65447998046875, -0.621978759765625, -0.5894775390625, -0.556976318359375, -0.52447509765625, -0.491973876953125, -0.45947265625, -0.426971435546875, -0.39447021484375, -0.361968994140625, -0.3294677734375, -0.296966552734375, -0.26446533203125, -0.231964111328125, -0.199462890625, -0.166961669921875, -0.13446044921875, -0.101959228515625, -0.0694580078125, -0.036956787109375, -0.00445556640625, 0.028045654296875, 0.060546875, 0.093048095703125, 0.12554931640625, 0.158050537109375, 0.1905517578125, 0.223052978515625, 0.25555419921875, 0.288055419921875, 0.320556640625, 0.353057861328125, 0.38555908203125, 0.418060302734375, 0.4505615234375, 0.483062744140625, 0.51556396484375, 0.548065185546875, 0.58056640625, 0.613067626953125, 0.64556884765625, 0.678070068359375, 0.7105712890625, 0.743072509765625, 0.77557373046875, 0.808074951171875, 0.840576171875, 0.873077392578125, 0.90557861328125, 0.938079833984375, 0.9705810546875, 1.003082275390625, 1.03558349609375, 1.068084716796875, 1.1005859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 7.0, 11.0, 10.0, 17.0, 16.0, 24.0, 42.0, 46.0, 47.0, 69.0, 64.0, 80.0, 69.0, 74.0, 88.0, 55.0, 45.0, 53.0, 49.0, 36.0, 11.0, 30.0, 14.0, 11.0, 6.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -1.9956512451171875, -1.938568115234375, -1.8814849853515625, -1.82440185546875, -1.7673187255859375, -1.710235595703125, -1.6531524658203125, -1.5960693359375, -1.5389862060546875, -1.481903076171875, -1.4248199462890625, -1.36773681640625, -1.3106536865234375, -1.253570556640625, -1.1964874267578125, -1.139404296875, -1.0823211669921875, -1.025238037109375, -0.9681549072265625, -0.91107177734375, -0.8539886474609375, -0.796905517578125, -0.7398223876953125, -0.6827392578125, -0.6256561279296875, -0.568572998046875, -0.5114898681640625, -0.45440673828125, -0.3973236083984375, -0.340240478515625, -0.2831573486328125, -0.22607421875, -0.1689910888671875, -0.111907958984375, -0.0548248291015625, 0.00225830078125, 0.0593414306640625, 0.116424560546875, 0.1735076904296875, 0.2305908203125, 0.2876739501953125, 0.344757080078125, 0.4018402099609375, 0.45892333984375, 0.5160064697265625, 0.573089599609375, 0.6301727294921875, 0.687255859375, 0.7443389892578125, 0.801422119140625, 0.8585052490234375, 0.91558837890625, 0.9726715087890625, 1.029754638671875, 1.0868377685546875, 1.1439208984375, 1.2010040283203125, 1.258087158203125, 1.3151702880859375, 1.37225341796875, 1.4293365478515625, 1.486419677734375, 1.5435028076171875, 1.6005859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 11.0, 10.0, 24.0, 42.0, 74.0, 99.0, 187.0, 422.0, 1192.0, 5295.0, 80168.0, 926413.0, 29718.0, 3313.0, 856.0, 324.0, 148.0, 100.0, 46.0, 30.0, 25.0, 11.0, 10.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4355316162109375, -0.423553466796875, -0.4115753173828125, -0.39959716796875, -0.3876190185546875, -0.375640869140625, -0.3636627197265625, -0.3516845703125, -0.3397064208984375, -0.327728271484375, -0.3157501220703125, -0.30377197265625, -0.2917938232421875, -0.279815673828125, -0.2678375244140625, -0.255859375, -0.2438812255859375, -0.231903076171875, -0.2199249267578125, -0.20794677734375, -0.1959686279296875, -0.183990478515625, -0.1720123291015625, -0.1600341796875, -0.1480560302734375, -0.136077880859375, -0.1240997314453125, -0.11212158203125, -0.1001434326171875, -0.088165283203125, -0.0761871337890625, -0.064208984375, -0.0522308349609375, -0.040252685546875, -0.0282745361328125, -0.01629638671875, -0.0043182373046875, 0.007659912109375, 0.0196380615234375, 0.0316162109375, 0.0435943603515625, 0.055572509765625, 0.0675506591796875, 0.07952880859375, 0.0915069580078125, 0.103485107421875, 0.1154632568359375, 0.12744140625, 0.1394195556640625, 0.151397705078125, 0.1633758544921875, 0.17535400390625, 0.1873321533203125, 0.199310302734375, 0.2112884521484375, 0.2232666015625, 0.2352447509765625, 0.247222900390625, 0.2592010498046875, 0.27117919921875, 0.2831573486328125, 0.295135498046875, 0.3071136474609375, 0.319091796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 0.0, 2.0, 4.0, 8.0, 7.0, 7.0, 8.0, 16.0, 27.0, 19.0, 36.0, 66.0, 108.0, 188.0, 176.0, 114.0, 63.0, 38.0, 25.0, 16.0, 15.0, 17.0, 8.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001633167266845703, -0.00015837885439395905, -0.00015344098210334778, -0.0001485031098127365, -0.00014356523752212524, -0.00013862736523151398, -0.0001336894929409027, -0.00012875162065029144, -0.00012381374835968018, -0.00011887587606906891, -0.00011393800377845764, -0.00010900013148784637, -0.00010406225919723511, -9.912438690662384e-05, -9.418651461601257e-05, -8.92486423254013e-05, -8.431077003479004e-05, -7.937289774417877e-05, -7.44350254535675e-05, -6.949715316295624e-05, -6.455928087234497e-05, -5.9621408581733704e-05, -5.4683536291122437e-05, -4.974566400051117e-05, -4.48077917098999e-05, -3.9869919419288635e-05, -3.493204712867737e-05, -2.99941748380661e-05, -2.5056302547454834e-05, -2.0118430256843567e-05, -1.51805579662323e-05, -1.0242685675621033e-05, -5.304813385009766e-06, -3.6694109439849854e-07, 4.5709311962127686e-06, 9.508803486824036e-06, 1.4446675777435303e-05, 1.938454806804657e-05, 2.4322420358657837e-05, 2.9260292649269104e-05, 3.419816493988037e-05, 3.913603723049164e-05, 4.4073909521102905e-05, 4.901178181171417e-05, 5.394965410232544e-05, 5.8887526392936707e-05, 6.382539868354797e-05, 6.876327097415924e-05, 7.370114326477051e-05, 7.863901555538177e-05, 8.357688784599304e-05, 8.851476013660431e-05, 9.345263242721558e-05, 9.839050471782684e-05, 0.00010332837700843811, 0.00010826624929904938, 0.00011320412158966064, 0.00011814199388027191, 0.00012307986617088318, 0.00012801773846149445, 0.0001329556107521057, 0.00013789348304271698, 0.00014283135533332825, 0.00014776922762393951, 0.00015270709991455078]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 11.0, 10.0, 15.0, 20.0, 33.0, 44.0, 82.0, 128.0, 263.0, 536.0, 1458.0, 6179.0, 72894.0, 906975.0, 52205.0, 5315.0, 1313.0, 486.0, 232.0, 142.0, 90.0, 52.0, 14.0, 23.0, 9.0, 9.0, 5.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.2172260284423828, -0.20605850219726562, -0.19489097595214844, -0.18372344970703125, -0.17255592346191406, -0.16138839721679688, -0.1502208709716797, -0.1390533447265625, -0.1278858184814453, -0.11671829223632812, -0.10555076599121094, -0.09438323974609375, -0.08321571350097656, -0.07204818725585938, -0.06088066101074219, -0.049713134765625, -0.03854560852050781, -0.027378082275390625, -0.016210556030273438, -0.00504302978515625, 0.0061244964599609375, 0.017292022705078125, 0.028459548950195312, 0.0396270751953125, 0.05079460144042969, 0.061962127685546875, 0.07312965393066406, 0.08429718017578125, 0.09546470642089844, 0.10663223266601562, 0.11779975891113281, 0.12896728515625, 0.1401348114013672, 0.15130233764648438, 0.16246986389160156, 0.17363739013671875, 0.18480491638183594, 0.19597244262695312, 0.2071399688720703, 0.2183074951171875, 0.2294750213623047, 0.24064254760742188, 0.25181007385253906, 0.26297760009765625, 0.27414512634277344, 0.2853126525878906, 0.2964801788330078, 0.307647705078125, 0.3188152313232422, 0.3299827575683594, 0.34115028381347656, 0.35231781005859375, 0.36348533630371094, 0.3746528625488281, 0.3858203887939453, 0.3969879150390625, 0.4081554412841797, 0.4193229675292969, 0.43049049377441406, 0.44165802001953125, 0.45282554626464844, 0.4639930725097656, 0.4751605987548828, 0.486328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 8.0, 10.0, 20.0, 23.0, 15.0, 34.0, 51.0, 39.0, 54.0, 68.0, 54.0, 78.0, 64.0, 74.0, 71.0, 54.0, 49.0, 56.0, 32.0, 25.0, 22.0, 9.0, 15.0, 10.0, 8.0, 2.0, 12.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.302734375, -0.29532814025878906, -0.2879219055175781, -0.2805156707763672, -0.27310943603515625, -0.2657032012939453, -0.2582969665527344, -0.25089073181152344, -0.2434844970703125, -0.23607826232910156, -0.22867202758789062, -0.2212657928466797, -0.21385955810546875, -0.2064533233642578, -0.19904708862304688, -0.19164085388183594, -0.184234619140625, -0.17682838439941406, -0.16942214965820312, -0.1620159149169922, -0.15460968017578125, -0.1472034454345703, -0.13979721069335938, -0.13239097595214844, -0.1249847412109375, -0.11757850646972656, -0.11017227172851562, -0.10276603698730469, -0.09535980224609375, -0.08795356750488281, -0.08054733276367188, -0.07314109802246094, -0.06573486328125, -0.05832862854003906, -0.050922393798828125, -0.04351615905761719, -0.03610992431640625, -0.028703689575195312, -0.021297454833984375, -0.013891220092773438, -0.0064849853515625, 0.0009212493896484375, 0.008327484130859375, 0.015733718872070312, 0.02313995361328125, 0.030546188354492188, 0.037952423095703125, 0.04535865783691406, 0.052764892578125, 0.06017112731933594, 0.06757736206054688, 0.07498359680175781, 0.08238983154296875, 0.08979606628417969, 0.09720230102539062, 0.10460853576660156, 0.1120147705078125, 0.11942100524902344, 0.12682723999023438, 0.1342334747314453, 0.14163970947265625, 0.1490459442138672, 0.15645217895507812, 0.16385841369628906, 0.1712646484375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 14.0, 76.0, 560.0, 283.0, 43.0, 19.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1772518157959, -18.717815399169922, -18.258378982543945, -17.79894256591797, -17.33950424194336, -16.880067825317383, -16.420631408691406, -15.96119499206543, -15.501758575439453, -15.042322158813477, -14.5828857421875, -14.123448371887207, -13.66401195526123, -13.204575538635254, -12.745138168334961, -12.285701751708984, -11.826265335083008, -11.366828918457031, -10.907392501831055, -10.447955131530762, -9.988518714904785, -9.529082298278809, -9.069644927978516, -8.610208511352539, -8.150772094726562, -7.691335678100586, -7.231898784637451, -6.772461891174316, -6.31302547454834, -5.853589057922363, -5.3941521644592285, -4.934715270996094, -4.475277900695801, -4.015841484069824, -3.5564045906066895, -3.096967935562134, -2.637531280517578, -2.1780946254730225, -1.7186579704284668, -1.2592213153839111, -0.7997846603393555, -0.3403480052947998, 0.11908864974975586, 0.5785253047943115, 1.0379619598388672, 1.4973986148834229, 1.9568352699279785, 2.416271924972534, 2.87570858001709, 3.3351452350616455, 3.794581890106201, 4.254018783569336, 4.7134552001953125, 5.172891616821289, 5.632328510284424, 6.091765403747559, 6.551201820373535, 7.010638236999512, 7.4700751304626465, 7.929512023925781, 8.388948440551758, 8.848384857177734, 9.307821273803711, 9.767258644104004, 10.22669506072998]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 8.0, 15.0, 9.0, 14.0, 21.0, 31.0, 29.0, 32.0, 52.0, 40.0, 59.0, 67.0, 78.0, 73.0, 65.0, 66.0, 58.0, 48.0, 48.0, 27.0, 29.0, 27.0, 23.0, 20.0, 8.0, 11.0, 10.0, 12.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.539610862731934, -5.338078022003174, -5.136545181274414, -4.935012340545654, -4.7334794998168945, -4.531946182250977, -4.330413341522217, -4.128880500793457, -3.9273476600646973, -3.7258148193359375, -3.5242819786071777, -3.322748899459839, -3.121216058731079, -2.9196832180023193, -2.7181501388549805, -2.5166172981262207, -2.315084457397461, -2.113551616668701, -1.9120186567306519, -1.7104856967926025, -1.5089528560638428, -1.307420015335083, -1.1058870553970337, -0.9043540954589844, -0.7028212547302246, -0.5012883543968201, -0.2997554540634155, -0.09822255373001099, 0.10331034660339355, 0.3048431873321533, 0.5063761472702026, 0.707909107208252, 0.9094424247741699, 1.1109752655029297, 1.312508225440979, 1.5140411853790283, 1.715574026107788, 1.9171068668365479, 2.1186399459838867, 2.3201727867126465, 2.5217056274414062, 2.723238468170166, 2.924771308898926, 3.1263043880462646, 3.3278372287750244, 3.529370069503784, 3.730903148651123, 3.932435989379883, 4.133968830108643, 4.335501670837402, 4.537034511566162, 4.738567352294922, 4.94010066986084, 5.141633033752441, 5.343166351318359, 5.544699192047119, 5.746232032775879, 5.947764873504639, 6.149297714233398, 6.350830554962158, 6.552363395690918, 6.753896713256836, 6.955429553985596, 7.1569623947143555, 7.358495235443115]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 11.0, 10.0, 11.0, 23.0, 10.0, 24.0, 41.0, 62.0, 58.0, 117.0, 292.0, 630.0, 1968.0, 7096.0, 51299.0, 3892196.0, 227285.0, 9238.0, 2112.0, 805.0, 355.0, 194.0, 113.0, 83.0, 53.0, 32.0, 33.0, 21.0, 26.0, 19.0, 12.0, 12.0, 7.0, 3.0, 10.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.66650390625, -0.6467132568359375, -0.626922607421875, -0.6071319580078125, -0.58734130859375, -0.5675506591796875, -0.547760009765625, -0.5279693603515625, -0.5081787109375, -0.4883880615234375, -0.468597412109375, -0.4488067626953125, -0.42901611328125, -0.4092254638671875, -0.389434814453125, -0.3696441650390625, -0.349853515625, -0.3300628662109375, -0.310272216796875, -0.2904815673828125, -0.27069091796875, -0.2509002685546875, -0.231109619140625, -0.2113189697265625, -0.1915283203125, -0.1717376708984375, -0.151947021484375, -0.1321563720703125, -0.11236572265625, -0.0925750732421875, -0.072784423828125, -0.0529937744140625, -0.033203125, -0.0134124755859375, 0.006378173828125, 0.0261688232421875, 0.04595947265625, 0.0657501220703125, 0.085540771484375, 0.1053314208984375, 0.1251220703125, 0.1449127197265625, 0.164703369140625, 0.1844940185546875, 0.20428466796875, 0.2240753173828125, 0.243865966796875, 0.2636566162109375, 0.283447265625, 0.3032379150390625, 0.323028564453125, 0.3428192138671875, 0.36260986328125, 0.3824005126953125, 0.402191162109375, 0.4219818115234375, 0.4417724609375, 0.4615631103515625, 0.481353759765625, 0.5011444091796875, 0.52093505859375, 0.5407257080078125, 0.560516357421875, 0.5803070068359375, 0.60009765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 12.0, 17.0, 23.0, 39.0, 61.0, 81.0, 117.0, 122.0, 135.0, 123.0, 101.0, 66.0, 36.0, 25.0, 16.0, 16.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.2962226867675781, -0.27677154541015625, -0.2573204040527344, -0.2378692626953125, -0.21841812133789062, -0.19896697998046875, -0.17951583862304688, -0.160064697265625, -0.14061355590820312, -0.12116241455078125, -0.10171127319335938, -0.0822601318359375, -0.06280899047851562, -0.04335784912109375, -0.023906707763671875, -0.00445556640625, 0.014995574951171875, 0.03444671630859375, 0.053897857666015625, 0.0733489990234375, 0.09280014038085938, 0.11225128173828125, 0.13170242309570312, 0.151153564453125, 0.17060470581054688, 0.19005584716796875, 0.20950698852539062, 0.2289581298828125, 0.24840927124023438, 0.26786041259765625, 0.2873115539550781, 0.3067626953125, 0.3262138366699219, 0.34566497802734375, 0.3651161193847656, 0.3845672607421875, 0.4040184020996094, 0.42346954345703125, 0.4429206848144531, 0.462371826171875, 0.4818229675292969, 0.5012741088867188, 0.5207252502441406, 0.5401763916015625, 0.5596275329589844, 0.5790786743164062, 0.5985298156738281, 0.61798095703125, 0.6374320983886719, 0.6568832397460938, 0.6763343811035156, 0.6957855224609375, 0.7152366638183594, 0.7346878051757812, 0.7541389465332031, 0.773590087890625, 0.7930412292480469, 0.8124923706054688, 0.8319435119628906, 0.8513946533203125, 0.8708457946777344, 0.8902969360351562, 0.9097480773925781, 0.92919921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 11.0, 23.0, 25.0, 21.0, 37.0, 50.0, 57.0, 148.0, 378.0, 1486.0, 6715.0, 44057.0, 3758659.0, 360516.0, 17612.0, 3059.0, 711.0, 212.0, 120.0, 69.0, 66.0, 60.0, 40.0, 39.0, 34.0, 23.0, 15.0, 12.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.7898025512695312, -0.7671051025390625, -0.7444076538085938, -0.721710205078125, -0.6990127563476562, -0.6763153076171875, -0.6536178588867188, -0.63092041015625, -0.6082229614257812, -0.5855255126953125, -0.5628280639648438, -0.540130615234375, -0.5174331665039062, -0.4947357177734375, -0.47203826904296875, -0.4493408203125, -0.42664337158203125, -0.4039459228515625, -0.38124847412109375, -0.358551025390625, -0.33585357666015625, -0.3131561279296875, -0.29045867919921875, -0.26776123046875, -0.24506378173828125, -0.2223663330078125, -0.19966888427734375, -0.176971435546875, -0.15427398681640625, -0.1315765380859375, -0.10887908935546875, -0.086181640625, -0.06348419189453125, -0.0407867431640625, -0.01808929443359375, 0.004608154296875, 0.02730560302734375, 0.0500030517578125, 0.07270050048828125, 0.09539794921875, 0.11809539794921875, 0.1407928466796875, 0.16349029541015625, 0.186187744140625, 0.20888519287109375, 0.2315826416015625, 0.25428009033203125, 0.2769775390625, 0.29967498779296875, 0.3223724365234375, 0.34506988525390625, 0.367767333984375, 0.39046478271484375, 0.4131622314453125, 0.43585968017578125, 0.45855712890625, 0.48125457763671875, 0.5039520263671875, 0.5266494750976562, 0.549346923828125, 0.5720443725585938, 0.5947418212890625, 0.6174392700195312, 0.64013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 7.0, 14.0, 20.0, 22.0, 42.0, 96.0, 457.0, 2268.0, 883.0, 150.0, 46.0, 29.0, 15.0, 11.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.493896484375, -0.4601020812988281, -0.42630767822265625, -0.3925132751464844, -0.3587188720703125, -0.3249244689941406, -0.29113006591796875, -0.2573356628417969, -0.223541259765625, -0.18974685668945312, -0.15595245361328125, -0.12215805053710938, -0.0883636474609375, -0.054569244384765625, -0.02077484130859375, 0.013019561767578125, 0.04681396484375, 0.08060836791992188, 0.11440277099609375, 0.14819717407226562, 0.1819915771484375, 0.21578598022460938, 0.24958038330078125, 0.2833747863769531, 0.317169189453125, 0.3509635925292969, 0.38475799560546875, 0.4185523986816406, 0.4523468017578125, 0.4861412048339844, 0.5199356079101562, 0.5537300109863281, 0.5875244140625, 0.6213188171386719, 0.6551132202148438, 0.6889076232910156, 0.7227020263671875, 0.7564964294433594, 0.7902908325195312, 0.8240852355957031, 0.857879638671875, 0.8916740417480469, 0.9254684448242188, 0.9592628479003906, 0.9930572509765625, 1.0268516540527344, 1.0606460571289062, 1.0944404602050781, 1.12823486328125, 1.1620292663574219, 1.1958236694335938, 1.2296180725097656, 1.2634124755859375, 1.2972068786621094, 1.3310012817382812, 1.3647956848144531, 1.398590087890625, 1.4323844909667969, 1.4661788940429688, 1.4999732971191406, 1.5337677001953125, 1.5675621032714844, 1.6013565063476562, 1.6351509094238281, 1.6689453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 27.0, 85.0, 331.0, 327.0, 118.0, 51.0, 21.0, 4.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.815892219543457, -4.636350154876709, -4.456808090209961, -4.277266025543213, -4.097723960876465, -3.918181896209717, -3.7386395931243896, -3.5590975284576416, -3.3795554637908936, -3.2000133991241455, -3.0204713344573975, -2.8409290313720703, -2.6613869667053223, -2.481844902038574, -2.302302837371826, -2.122760772705078, -1.94321870803833, -1.763676643371582, -1.584134578704834, -1.4045923948287964, -1.2250503301620483, -1.0455082654953003, -0.8659660816192627, -0.6864240169525146, -0.5068819522857666, -0.32733985781669617, -0.14779776334762573, 0.03174436092376709, 0.21128642559051514, 0.3908284902572632, 0.5703706741333008, 0.7499127388000488, 0.9294543266296387, 1.1089963912963867, 1.2885384559631348, 1.4680806398391724, 1.6476227045059204, 1.8271647691726685, 2.006706953048706, 2.186249017715454, 2.365791082382202, 2.54533314704895, 2.7248752117156982, 2.9044175148010254, 3.0839595794677734, 3.2635016441345215, 3.4430437088012695, 3.6225857734680176, 3.8021278381347656, 3.9816699028015137, 4.161211967468262, 4.34075403213501, 4.520296096801758, 4.699838161468506, 4.879380226135254, 5.05892276763916, 5.23846435546875, 5.418006420135498, 5.597548484802246, 5.777090549468994, 5.956632614135742, 6.13617467880249, 6.315716743469238, 6.4952592849731445, 6.674801349639893]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 4.0, 6.0, 12.0, 15.0, 22.0, 35.0, 44.0, 47.0, 56.0, 73.0, 69.0, 97.0, 80.0, 60.0, 70.0, 79.0, 45.0, 54.0, 41.0, 25.0, 24.0, 8.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6425580978393555, -4.530004501342773, -4.417450904846191, -4.304897308349609, -4.192343711853027, -4.079790115356445, -3.967236280441284, -3.854682683944702, -3.74212908744812, -3.629575490951538, -3.517021894454956, -3.404468297958374, -3.291914463043213, -3.179360866546631, -3.066807270050049, -2.954253673553467, -2.8417000770568848, -2.7291464805603027, -2.6165928840637207, -2.5040392875671387, -2.3914856910705566, -2.2789320945739746, -2.1663782596588135, -2.0538246631622314, -1.9412710666656494, -1.8287174701690674, -1.7161638736724854, -1.6036101579666138, -1.4910565614700317, -1.3785029649734497, -1.2659492492675781, -1.153395652770996, -1.040842056274414, -0.928288459777832, -0.8157348036766052, -0.7031811475753784, -0.5906275510787964, -0.47807395458221436, -0.36552029848098755, -0.25296664237976074, -0.1404130458831787, -0.027859419584274292, 0.08469420671463013, 0.19724783301353455, 0.30980145931243896, 0.422355055809021, 0.5349087119102478, 0.6474623680114746, 0.7600159645080566, 0.8725695610046387, 0.9851232171058655, 1.0976768732070923, 1.2102304697036743, 1.3227840662002563, 1.435337781906128, 1.54789137840271, 1.660444974899292, 1.772998571395874, 1.885552167892456, 1.9981058835983276, 2.110659599304199, 2.2232131958007812, 2.3357667922973633, 2.4483203887939453, 2.5608739852905273]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 11.0, 17.0, 42.0, 36.0, 76.0, 107.0, 162.0, 304.0, 520.0, 1042.0, 2210.0, 5132.0, 14156.0, 47593.0, 202681.0, 527691.0, 181051.0, 43377.0, 13136.0, 4888.0, 2047.0, 997.0, 498.0, 313.0, 168.0, 95.0, 52.0, 45.0, 38.0, 15.0, 13.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.385986328125, -0.374786376953125, -0.36358642578125, -0.352386474609375, -0.3411865234375, -0.329986572265625, -0.31878662109375, -0.307586669921875, -0.29638671875, -0.285186767578125, -0.27398681640625, -0.262786865234375, -0.2515869140625, -0.240386962890625, -0.22918701171875, -0.217987060546875, -0.206787109375, -0.195587158203125, -0.18438720703125, -0.173187255859375, -0.1619873046875, -0.150787353515625, -0.13958740234375, -0.128387451171875, -0.1171875, -0.105987548828125, -0.09478759765625, -0.083587646484375, -0.0723876953125, -0.061187744140625, -0.04998779296875, -0.038787841796875, -0.027587890625, -0.016387939453125, -0.00518798828125, 0.006011962890625, 0.0172119140625, 0.028411865234375, 0.03961181640625, 0.050811767578125, 0.06201171875, 0.073211669921875, 0.08441162109375, 0.095611572265625, 0.1068115234375, 0.118011474609375, 0.12921142578125, 0.140411376953125, 0.151611328125, 0.162811279296875, 0.17401123046875, 0.185211181640625, 0.1964111328125, 0.207611083984375, 0.21881103515625, 0.230010986328125, 0.2412109375, 0.252410888671875, 0.26361083984375, 0.274810791015625, 0.2860107421875, 0.297210693359375, 0.30841064453125, 0.319610595703125, 0.330810546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 16.0, 10.0, 13.0, 16.0, 20.0, 39.0, 41.0, 37.0, 54.0, 50.0, 67.0, 80.0, 81.0, 73.0, 62.0, 52.0, 65.0, 42.0, 51.0, 28.0, 30.0, 14.0, 14.0, 6.0, 10.0, 10.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28662109375, -0.27581787109375, -0.2650146484375, -0.25421142578125, -0.243408203125, -0.23260498046875, -0.2218017578125, -0.21099853515625, -0.2001953125, -0.18939208984375, -0.1785888671875, -0.16778564453125, -0.156982421875, -0.14617919921875, -0.1353759765625, -0.12457275390625, -0.11376953125, -0.10296630859375, -0.0921630859375, -0.08135986328125, -0.070556640625, -0.05975341796875, -0.0489501953125, -0.03814697265625, -0.02734375, -0.01654052734375, -0.0057373046875, 0.00506591796875, 0.015869140625, 0.02667236328125, 0.0374755859375, 0.04827880859375, 0.05908203125, 0.06988525390625, 0.0806884765625, 0.09149169921875, 0.102294921875, 0.11309814453125, 0.1239013671875, 0.13470458984375, 0.1455078125, 0.15631103515625, 0.1671142578125, 0.17791748046875, 0.188720703125, 0.19952392578125, 0.2103271484375, 0.22113037109375, 0.23193359375, 0.24273681640625, 0.2535400390625, 0.26434326171875, 0.275146484375, 0.28594970703125, 0.2967529296875, 0.30755615234375, 0.318359375, 0.32916259765625, 0.3399658203125, 0.35076904296875, 0.361572265625, 0.37237548828125, 0.3831787109375, 0.39398193359375, 0.40478515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 7.0, 12.0, 32.0, 40.0, 71.0, 171.0, 346.0, 1009.0, 4090.0, 196917.0, 836352.0, 7293.0, 1322.0, 472.0, 197.0, 92.0, 40.0, 30.0, 9.0, 13.0, 6.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.63671875, -1.5887603759765625, -1.540802001953125, -1.4928436279296875, -1.44488525390625, -1.3969268798828125, -1.348968505859375, -1.3010101318359375, -1.2530517578125, -1.2050933837890625, -1.157135009765625, -1.1091766357421875, -1.06121826171875, -1.0132598876953125, -0.965301513671875, -0.9173431396484375, -0.869384765625, -0.8214263916015625, -0.773468017578125, -0.7255096435546875, -0.67755126953125, -0.6295928955078125, -0.581634521484375, -0.5336761474609375, -0.4857177734375, -0.4377593994140625, -0.389801025390625, -0.3418426513671875, -0.29388427734375, -0.2459259033203125, -0.197967529296875, -0.1500091552734375, -0.10205078125, -0.0540924072265625, -0.006134033203125, 0.0418243408203125, 0.08978271484375, 0.1377410888671875, 0.185699462890625, 0.2336578369140625, 0.2816162109375, 0.3295745849609375, 0.377532958984375, 0.4254913330078125, 0.47344970703125, 0.5214080810546875, 0.569366455078125, 0.6173248291015625, 0.665283203125, 0.7132415771484375, 0.761199951171875, 0.8091583251953125, 0.85711669921875, 0.9050750732421875, 0.953033447265625, 1.0009918212890625, 1.0489501953125, 1.0969085693359375, 1.144866943359375, 1.1928253173828125, 1.24078369140625, 1.2887420654296875, 1.336700439453125, 1.3846588134765625, 1.4326171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 18.0, 30.0, 45.0, 93.0, 122.0, 126.0, 144.0, 143.0, 101.0, 70.0, 48.0, 27.0, 18.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.283203125, -3.1998291015625, -3.116455078125, -3.0330810546875, -2.94970703125, -2.8663330078125, -2.782958984375, -2.6995849609375, -2.6162109375, -2.5328369140625, -2.449462890625, -2.3660888671875, -2.28271484375, -2.1993408203125, -2.115966796875, -2.0325927734375, -1.94921875, -1.8658447265625, -1.782470703125, -1.6990966796875, -1.61572265625, -1.5323486328125, -1.448974609375, -1.3656005859375, -1.2822265625, -1.1988525390625, -1.115478515625, -1.0321044921875, -0.94873046875, -0.8653564453125, -0.781982421875, -0.6986083984375, -0.615234375, -0.5318603515625, -0.448486328125, -0.3651123046875, -0.28173828125, -0.1983642578125, -0.114990234375, -0.0316162109375, 0.0517578125, 0.1351318359375, 0.218505859375, 0.3018798828125, 0.38525390625, 0.4686279296875, 0.552001953125, 0.6353759765625, 0.71875, 0.8021240234375, 0.885498046875, 0.9688720703125, 1.05224609375, 1.1356201171875, 1.218994140625, 1.3023681640625, 1.3857421875, 1.4691162109375, 1.552490234375, 1.6358642578125, 1.71923828125, 1.8026123046875, 1.885986328125, 1.9693603515625, 2.052734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 8.0, 8.0, 7.0, 13.0, 23.0, 25.0, 39.0, 72.0, 129.0, 309.0, 1311.0, 16288.0, 989643.0, 37973.0, 1907.0, 409.0, 166.0, 82.0, 41.0, 35.0, 17.0, 9.0, 11.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47021484375, -0.45377349853515625, -0.4373321533203125, -0.42089080810546875, -0.404449462890625, -0.38800811767578125, -0.3715667724609375, -0.35512542724609375, -0.33868408203125, -0.32224273681640625, -0.3058013916015625, -0.28936004638671875, -0.272918701171875, -0.25647735595703125, -0.2400360107421875, -0.22359466552734375, -0.2071533203125, -0.19071197509765625, -0.1742706298828125, -0.15782928466796875, -0.141387939453125, -0.12494659423828125, -0.1085052490234375, -0.09206390380859375, -0.07562255859375, -0.05918121337890625, -0.0427398681640625, -0.02629852294921875, -0.009857177734375, 0.00658416748046875, 0.0230255126953125, 0.03946685791015625, 0.055908203125, 0.07234954833984375, 0.0887908935546875, 0.10523223876953125, 0.121673583984375, 0.13811492919921875, 0.1545562744140625, 0.17099761962890625, 0.18743896484375, 0.20388031005859375, 0.2203216552734375, 0.23676300048828125, 0.253204345703125, 0.26964569091796875, 0.2860870361328125, 0.30252838134765625, 0.3189697265625, 0.33541107177734375, 0.3518524169921875, 0.36829376220703125, 0.384735107421875, 0.40117645263671875, 0.4176177978515625, 0.43405914306640625, 0.45050048828125, 0.46694183349609375, 0.4833831787109375, 0.49982452392578125, 0.516265869140625, 0.5327072143554688, 0.5491485595703125, 0.5655899047851562, 0.58203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 6.0, 4.0, 5.0, 3.0, 5.0, 2.0, 6.0, 7.0, 11.0, 8.0, 9.0, 20.0, 27.0, 27.0, 49.0, 98.0, 122.0, 173.0, 140.0, 99.0, 50.0, 37.0, 16.0, 15.0, 15.0, 8.0, 8.0, 9.0, 2.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.423494338989258e-05, -9.103305637836456e-05, -8.783116936683655e-05, -8.462928235530853e-05, -8.142739534378052e-05, -7.82255083322525e-05, -7.502362132072449e-05, -7.182173430919647e-05, -6.861984729766846e-05, -6.541796028614044e-05, -6.221607327461243e-05, -5.901418626308441e-05, -5.5812299251556396e-05, -5.261041224002838e-05, -4.9408525228500366e-05, -4.620663821697235e-05, -4.3004751205444336e-05, -3.980286419391632e-05, -3.6600977182388306e-05, -3.339909017086029e-05, -3.0197203159332275e-05, -2.699531614780426e-05, -2.3793429136276245e-05, -2.059154212474823e-05, -1.7389655113220215e-05, -1.41877681016922e-05, -1.0985881090164185e-05, -7.78399407863617e-06, -4.582107067108154e-06, -1.3802200555801392e-06, 1.821666955947876e-06, 5.023553967475891e-06, 8.225440979003906e-06, 1.1427327990531921e-05, 1.4629215002059937e-05, 1.783110201358795e-05, 2.1032989025115967e-05, 2.4234876036643982e-05, 2.7436763048171997e-05, 3.063865005970001e-05, 3.384053707122803e-05, 3.704242408275604e-05, 4.024431109428406e-05, 4.344619810581207e-05, 4.664808511734009e-05, 4.98499721288681e-05, 5.305185914039612e-05, 5.625374615192413e-05, 5.945563316345215e-05, 6.265752017498016e-05, 6.585940718650818e-05, 6.90612941980362e-05, 7.226318120956421e-05, 7.546506822109222e-05, 7.866695523262024e-05, 8.186884224414825e-05, 8.507072925567627e-05, 8.827261626720428e-05, 9.14745032787323e-05, 9.467639029026031e-05, 9.787827730178833e-05, 0.00010108016431331635, 0.00010428205132484436, 0.00010748393833637238, 0.00011068582534790039]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 18.0, 19.0, 23.0, 35.0, 54.0, 84.0, 158.0, 310.0, 699.0, 1984.0, 10839.0, 240039.0, 766955.0, 22399.0, 3153.0, 899.0, 392.0, 180.0, 117.0, 73.0, 41.0, 21.0, 17.0, 12.0, 12.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2479248046875, -0.2380695343017578, -0.22821426391601562, -0.21835899353027344, -0.20850372314453125, -0.19864845275878906, -0.18879318237304688, -0.1789379119873047, -0.1690826416015625, -0.1592273712158203, -0.14937210083007812, -0.13951683044433594, -0.12966156005859375, -0.11980628967285156, -0.10995101928710938, -0.10009574890136719, -0.090240478515625, -0.08038520812988281, -0.07052993774414062, -0.06067466735839844, -0.05081939697265625, -0.04096412658691406, -0.031108856201171875, -0.021253585815429688, -0.0113983154296875, -0.0015430450439453125, 0.008312225341796875, 0.018167495727539062, 0.02802276611328125, 0.03787803649902344, 0.047733306884765625, 0.05758857727050781, 0.06744384765625, 0.07729911804199219, 0.08715438842773438, 0.09700965881347656, 0.10686492919921875, 0.11672019958496094, 0.12657546997070312, 0.1364307403564453, 0.1462860107421875, 0.1561412811279297, 0.16599655151367188, 0.17585182189941406, 0.18570709228515625, 0.19556236267089844, 0.20541763305664062, 0.2152729034423828, 0.225128173828125, 0.2349834442138672, 0.24483871459960938, 0.25469398498535156, 0.26454925537109375, 0.27440452575683594, 0.2842597961425781, 0.2941150665283203, 0.3039703369140625, 0.3138256072998047, 0.3236808776855469, 0.33353614807128906, 0.34339141845703125, 0.35324668884277344, 0.3631019592285156, 0.3729572296142578, 0.3828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 2.0, 0.0, 4.0, 7.0, 6.0, 2.0, 7.0, 8.0, 16.0, 13.0, 23.0, 20.0, 31.0, 41.0, 61.0, 53.0, 70.0, 81.0, 110.0, 81.0, 75.0, 77.0, 54.0, 30.0, 24.0, 22.0, 21.0, 18.0, 7.0, 10.0, 2.0, 2.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2054443359375, -0.1993122100830078, -0.19318008422851562, -0.18704795837402344, -0.18091583251953125, -0.17478370666503906, -0.16865158081054688, -0.1625194549560547, -0.1563873291015625, -0.1502552032470703, -0.14412307739257812, -0.13799095153808594, -0.13185882568359375, -0.12572669982910156, -0.11959457397460938, -0.11346244812011719, -0.107330322265625, -0.10119819641113281, -0.09506607055664062, -0.08893394470214844, -0.08280181884765625, -0.07666969299316406, -0.07053756713867188, -0.06440544128417969, -0.0582733154296875, -0.05214118957519531, -0.046009063720703125, -0.03987693786621094, -0.03374481201171875, -0.027612686157226562, -0.021480560302734375, -0.015348434448242188, -0.00921630859375, -0.0030841827392578125, 0.003047943115234375, 0.009180068969726562, 0.01531219482421875, 0.021444320678710938, 0.027576446533203125, 0.03370857238769531, 0.0398406982421875, 0.04597282409667969, 0.052104949951171875, 0.05823707580566406, 0.06436920166015625, 0.07050132751464844, 0.07663345336914062, 0.08276557922363281, 0.088897705078125, 0.09502983093261719, 0.10116195678710938, 0.10729408264160156, 0.11342620849609375, 0.11955833435058594, 0.12569046020507812, 0.1318225860595703, 0.1379547119140625, 0.1440868377685547, 0.15021896362304688, 0.15635108947753906, 0.16248321533203125, 0.16861534118652344, 0.17474746704101562, 0.1808795928955078, 0.18701171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 10.0, 5.0, 13.0, 122.0, 668.0, 156.0, 21.0, 9.0, 1.0, 2.0, 1.0, 2.0], "bins": [-26.998016357421875, -26.521320343017578, -26.04462242126465, -25.56792640686035, -25.091230392456055, -24.614534378051758, -24.137836456298828, -23.66114044189453, -23.184444427490234, -22.707748413085938, -22.231050491333008, -21.75435447692871, -21.277658462524414, -20.800962448120117, -20.324264526367188, -19.84756851196289, -19.370872497558594, -18.894176483154297, -18.417478561401367, -17.94078254699707, -17.464086532592773, -16.987390518188477, -16.510692596435547, -16.03399658203125, -15.55729866027832, -15.080601692199707, -14.60390567779541, -14.127208709716797, -13.6505126953125, -13.173815727233887, -12.697118759155273, -12.220422744750977, -11.743725776672363, -11.26702880859375, -10.790332794189453, -10.31363582611084, -9.836939811706543, -9.36024284362793, -8.883546829223633, -8.40684986114502, -7.9301533699035645, -7.453456878662109, -6.976760387420654, -6.500063896179199, -6.023366928100586, -5.546670913696289, -5.069973945617676, -4.593277454376221, -4.116580963134766, -3.6398844718933105, -3.1631879806518555, -2.6864912509918213, -2.209794759750366, -1.7330982685089111, -1.256401538848877, -0.7797050476074219, -0.3030085563659668, 0.17368799448013306, 0.6503845453262329, 1.1270811557769775, 1.6037776470184326, 2.0804741382598877, 2.557170867919922, 3.033867359161377, 3.510563850402832]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 21.0, 25.0, 26.0, 39.0, 67.0, 70.0, 77.0, 98.0, 119.0, 105.0, 71.0, 62.0, 56.0, 43.0, 36.0, 27.0, 14.0, 13.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.415787696838379, -7.1360368728637695, -6.856285572052002, -6.576534748077393, -6.296783447265625, -6.017032623291016, -5.737281799316406, -5.457530498504639, -5.177779197692871, -4.898028373718262, -4.618277072906494, -4.338526248931885, -4.058774948120117, -3.779024124145508, -3.4992730617523193, -3.219521999359131, -2.9397711753845215, -2.660020112991333, -2.3802690505981445, -2.100518226623535, -1.8207670450210571, -1.5410159826278687, -1.2612650394439697, -0.9815139770507812, -0.7017629146575928, -0.4220118820667267, -0.1422608494758606, 0.1374901533126831, 0.4172412157058716, 0.6969922780990601, 0.976743221282959, 1.2564942836761475, 1.536245346069336, 1.8159964084625244, 2.095747470855713, 2.3754982948303223, 2.65524959564209, 2.935000419616699, 3.2147514820098877, 3.494502544403076, 3.7742536067962646, 4.054004669189453, 4.3337554931640625, 4.61350679397583, 4.8932576179504395, 5.173008918762207, 5.452759742736816, 5.732510566711426, 6.012261867523193, 6.292012691497803, 6.57176399230957, 6.85151481628418, 7.131266117095947, 7.411016941070557, 7.690768241882324, 7.970519065856934, 8.250269889831543, 8.530020713806152, 8.809771537780762, 9.089523315429688, 9.369274139404297, 9.649024963378906, 9.928775787353516, 10.208526611328125, 10.48827838897705]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 24.0, 28.0, 36.0, 51.0, 99.0, 166.0, 275.0, 457.0, 849.0, 1675.0, 3999.0, 10788.0, 41336.0, 343174.0, 2739414.0, 942847.0, 83579.0, 15686.0, 5074.0, 2144.0, 1051.0, 571.0, 336.0, 212.0, 136.0, 82.0, 61.0, 34.0, 25.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.192169189453125, -0.18438720703125, -0.176605224609375, -0.1688232421875, -0.161041259765625, -0.15325927734375, -0.145477294921875, -0.1376953125, -0.129913330078125, -0.12213134765625, -0.114349365234375, -0.1065673828125, -0.098785400390625, -0.09100341796875, -0.083221435546875, -0.075439453125, -0.067657470703125, -0.05987548828125, -0.052093505859375, -0.0443115234375, -0.036529541015625, -0.02874755859375, -0.020965576171875, -0.01318359375, -0.005401611328125, 0.00238037109375, 0.010162353515625, 0.0179443359375, 0.025726318359375, 0.03350830078125, 0.041290283203125, 0.049072265625, 0.056854248046875, 0.06463623046875, 0.072418212890625, 0.0802001953125, 0.087982177734375, 0.09576416015625, 0.103546142578125, 0.111328125, 0.119110107421875, 0.12689208984375, 0.134674072265625, 0.1424560546875, 0.150238037109375, 0.15802001953125, 0.165802001953125, 0.173583984375, 0.181365966796875, 0.18914794921875, 0.196929931640625, 0.2047119140625, 0.212493896484375, 0.22027587890625, 0.228057861328125, 0.23583984375, 0.243621826171875, 0.25140380859375, 0.259185791015625, 0.2669677734375, 0.274749755859375, 0.28253173828125, 0.290313720703125, 0.298095703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 10.0, 6.0, 16.0, 16.0, 17.0, 17.0, 40.0, 45.0, 43.0, 42.0, 49.0, 50.0, 66.0, 55.0, 68.0, 53.0, 66.0, 58.0, 53.0, 45.0, 31.0, 40.0, 38.0, 20.0, 15.0, 6.0, 8.0, 9.0, 6.0, 6.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.23091697692871094, -0.22245407104492188, -0.2139911651611328, -0.20552825927734375, -0.1970653533935547, -0.18860244750976562, -0.18013954162597656, -0.1716766357421875, -0.16321372985839844, -0.15475082397460938, -0.1462879180908203, -0.13782501220703125, -0.1293621063232422, -0.12089920043945312, -0.11243629455566406, -0.103973388671875, -0.09551048278808594, -0.08704757690429688, -0.07858467102050781, -0.07012176513671875, -0.06165885925292969, -0.053195953369140625, -0.04473304748535156, -0.0362701416015625, -0.027807235717773438, -0.019344329833984375, -0.010881423950195312, -0.00241851806640625, 0.0060443878173828125, 0.014507293701171875, 0.022970199584960938, 0.03143310546875, 0.03989601135253906, 0.048358917236328125, 0.05682182312011719, 0.06528472900390625, 0.07374763488769531, 0.08221054077148438, 0.09067344665527344, 0.0991363525390625, 0.10759925842285156, 0.11606216430664062, 0.12452507019042969, 0.13298797607421875, 0.1414508819580078, 0.14991378784179688, 0.15837669372558594, 0.166839599609375, 0.17530250549316406, 0.18376541137695312, 0.1922283172607422, 0.20069122314453125, 0.2091541290283203, 0.21761703491210938, 0.22607994079589844, 0.2345428466796875, 0.24300575256347656, 0.2514686584472656, 0.2599315643310547, 0.26839447021484375, 0.2768573760986328, 0.2853202819824219, 0.29378318786621094, 0.30224609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 6.0, 10.0, 6.0, 17.0, 25.0, 30.0, 51.0, 61.0, 120.0, 189.0, 306.0, 642.0, 1488.0, 3878.0, 13195.0, 61977.0, 902355.0, 3074858.0, 107887.0, 18558.0, 5176.0, 1772.0, 780.0, 376.0, 181.0, 97.0, 67.0, 51.0, 28.0, 24.0, 22.0, 14.0, 12.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3577728271484375, -0.346649169921875, -0.3355255126953125, -0.32440185546875, -0.3132781982421875, -0.302154541015625, -0.2910308837890625, -0.2799072265625, -0.2687835693359375, -0.257659912109375, -0.2465362548828125, -0.23541259765625, -0.2242889404296875, -0.213165283203125, -0.2020416259765625, -0.19091796875, -0.1797943115234375, -0.168670654296875, -0.1575469970703125, -0.14642333984375, -0.1352996826171875, -0.124176025390625, -0.1130523681640625, -0.1019287109375, -0.0908050537109375, -0.079681396484375, -0.0685577392578125, -0.05743408203125, -0.0463104248046875, -0.035186767578125, -0.0240631103515625, -0.012939453125, -0.0018157958984375, 0.009307861328125, 0.0204315185546875, 0.03155517578125, 0.0426788330078125, 0.053802490234375, 0.0649261474609375, 0.0760498046875, 0.0871734619140625, 0.098297119140625, 0.1094207763671875, 0.12054443359375, 0.1316680908203125, 0.142791748046875, 0.1539154052734375, 0.1650390625, 0.1761627197265625, 0.187286376953125, 0.1984100341796875, 0.20953369140625, 0.2206573486328125, 0.231781005859375, 0.2429046630859375, 0.2540283203125, 0.2651519775390625, 0.276275634765625, 0.2873992919921875, 0.29852294921875, 0.3096466064453125, 0.320770263671875, 0.3318939208984375, 0.343017578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 7.0, 12.0, 16.0, 19.0, 23.0, 45.0, 42.0, 80.0, 139.0, 300.0, 676.0, 1110.0, 872.0, 353.0, 141.0, 88.0, 40.0, 25.0, 21.0, 14.0, 11.0, 6.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5779876708984375, -0.561248779296875, -0.5445098876953125, -0.52777099609375, -0.5110321044921875, -0.494293212890625, -0.4775543212890625, -0.4608154296875, -0.4440765380859375, -0.427337646484375, -0.4105987548828125, -0.39385986328125, -0.3771209716796875, -0.360382080078125, -0.3436431884765625, -0.326904296875, -0.3101654052734375, -0.293426513671875, -0.2766876220703125, -0.25994873046875, -0.2432098388671875, -0.226470947265625, -0.2097320556640625, -0.1929931640625, -0.1762542724609375, -0.159515380859375, -0.1427764892578125, -0.12603759765625, -0.1092987060546875, -0.092559814453125, -0.0758209228515625, -0.05908203125, -0.0423431396484375, -0.025604248046875, -0.0088653564453125, 0.00787353515625, 0.0246124267578125, 0.041351318359375, 0.0580902099609375, 0.0748291015625, 0.0915679931640625, 0.108306884765625, 0.1250457763671875, 0.14178466796875, 0.1585235595703125, 0.175262451171875, 0.1920013427734375, 0.208740234375, 0.2254791259765625, 0.242218017578125, 0.2589569091796875, 0.27569580078125, 0.2924346923828125, 0.309173583984375, 0.3259124755859375, 0.3426513671875, 0.3593902587890625, 0.376129150390625, 0.3928680419921875, 0.40960693359375, 0.4263458251953125, 0.443084716796875, 0.4598236083984375, 0.4765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 51.0, 413.0, 455.0, 43.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.742006301879883, -6.437751293182373, -6.133496284484863, -5.829241752624512, -5.524986743927002, -5.220731735229492, -4.916477203369141, -4.612222194671631, -4.307967185974121, -4.003712177276611, -3.6994574069976807, -3.39520263671875, -3.0909476280212402, -2.7866926193237305, -2.4824378490448, -2.178183078765869, -1.8739280700683594, -1.5696731805801392, -1.265418291091919, -0.9611634016036987, -0.6569085121154785, -0.3526536226272583, -0.048398733139038086, 0.2558560371398926, 0.5601110458374023, 0.8643659353256226, 1.1686208248138428, 1.472875714302063, 1.7771306037902832, 2.081385612487793, 2.3856403827667236, 2.6898951530456543, 2.994150161743164, 3.298405170440674, 3.6026599407196045, 3.906914710998535, 4.211169719696045, 4.515424728393555, 4.819679260253906, 5.123934268951416, 5.428189277648926, 5.7324442863464355, 6.036699295043945, 6.340953826904297, 6.645208835601807, 6.949463844299316, 7.253718376159668, 7.557973384857178, 7.8622283935546875, 8.166482925415039, 8.470738410949707, 8.774992942810059, 9.079248428344727, 9.383502960205078, 9.68775749206543, 9.992012023925781, 10.29626750946045, 10.6005220413208, 10.904777526855469, 11.20903205871582, 11.513286590576172, 11.81754207611084, 12.121796607971191, 12.42605209350586, 12.730306625366211]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 9.0, 15.0, 16.0, 19.0, 23.0, 22.0, 26.0, 49.0, 42.0, 48.0, 47.0, 55.0, 68.0, 63.0, 63.0, 53.0, 53.0, 48.0, 39.0, 29.0, 33.0, 33.0, 22.0, 14.0, 23.0, 22.0, 11.0, 12.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.8203125, -2.743502140045166, -2.666692018508911, -2.589881658554077, -2.513071298599243, -2.4362611770629883, -2.3594508171081543, -2.2826404571533203, -2.2058303356170654, -2.1290199756622314, -2.0522098541259766, -1.9753994941711426, -1.8985892534255981, -1.8217790126800537, -1.7449686527252197, -1.6681584119796753, -1.5913480520248413, -1.5145378112792969, -1.437727451324463, -1.3609172105789185, -1.284106969833374, -1.20729660987854, -1.1304863691329956, -1.0536761283874512, -0.976865828037262, -0.9000555276870728, -0.8232452869415283, -0.7464349865913391, -0.6696246862411499, -0.5928144454956055, -0.5160041451454163, -0.4391939043998718, -0.3623836040496826, -0.2855733335018158, -0.20876304805278778, -0.13195276260375977, -0.055142492055892944, 0.021667778491973877, 0.09847807884216309, 0.17528831958770752, 0.25209861993789673, 0.32890889048576355, 0.40571916103363037, 0.4825294613838196, 0.5593397617340088, 0.6361500024795532, 0.7129603028297424, 0.7897705435752869, 0.8665808439254761, 0.9433911442756653, 1.0202014446258545, 1.097011685371399, 1.1738219261169434, 1.2506322860717773, 1.3274425268173218, 1.4042527675628662, 1.4810631275177002, 1.5578733682632446, 1.6346837282180786, 1.711493968963623, 1.7883042097091675, 1.865114450454712, 1.941924810409546, 2.018734931945801, 2.0955452919006348]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 9.0, 23.0, 28.0, 49.0, 63.0, 122.0, 251.0, 576.0, 1128.0, 2526.0, 6484.0, 18139.0, 60105.0, 212759.0, 434005.0, 219133.0, 62594.0, 18981.0, 6649.0, 2644.0, 1138.0, 538.0, 264.0, 150.0, 83.0, 35.0, 30.0, 17.0, 13.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.279296875, -0.2720451354980469, -0.26479339599609375, -0.2575416564941406, -0.2502899169921875, -0.24303817749023438, -0.23578643798828125, -0.22853469848632812, -0.221282958984375, -0.21403121948242188, -0.20677947998046875, -0.19952774047851562, -0.1922760009765625, -0.18502426147460938, -0.17777252197265625, -0.17052078247070312, -0.16326904296875, -0.15601730346679688, -0.14876556396484375, -0.14151382446289062, -0.1342620849609375, -0.12701034545898438, -0.11975860595703125, -0.11250686645507812, -0.105255126953125, -0.09800338745117188, -0.09075164794921875, -0.08349990844726562, -0.0762481689453125, -0.06899642944335938, -0.06174468994140625, -0.054492950439453125, -0.0472412109375, -0.039989471435546875, -0.03273773193359375, -0.025485992431640625, -0.0182342529296875, -0.010982513427734375, -0.00373077392578125, 0.003520965576171875, 0.010772705078125, 0.018024444580078125, 0.02527618408203125, 0.032527923583984375, 0.0397796630859375, 0.047031402587890625, 0.05428314208984375, 0.061534881591796875, 0.06878662109375, 0.07603836059570312, 0.08329010009765625, 0.09054183959960938, 0.0977935791015625, 0.10504531860351562, 0.11229705810546875, 0.11954879760742188, 0.126800537109375, 0.13405227661132812, 0.14130401611328125, 0.14855575561523438, 0.1558074951171875, 0.16305923461914062, 0.17031097412109375, 0.17756271362304688, 0.184814453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 4.0, 10.0, 13.0, 11.0, 14.0, 24.0, 23.0, 33.0, 37.0, 40.0, 47.0, 51.0, 42.0, 63.0, 64.0, 65.0, 62.0, 65.0, 60.0, 48.0, 37.0, 41.0, 27.0, 21.0, 26.0, 15.0, 16.0, 12.0, 7.0, 7.0, 9.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.242431640625, -0.23490333557128906, -0.22737503051757812, -0.2198467254638672, -0.21231842041015625, -0.2047901153564453, -0.19726181030273438, -0.18973350524902344, -0.1822052001953125, -0.17467689514160156, -0.16714859008789062, -0.1596202850341797, -0.15209197998046875, -0.1445636749267578, -0.13703536987304688, -0.12950706481933594, -0.121978759765625, -0.11445045471191406, -0.10692214965820312, -0.09939384460449219, -0.09186553955078125, -0.08433723449707031, -0.07680892944335938, -0.06928062438964844, -0.0617523193359375, -0.05422401428222656, -0.046695709228515625, -0.03916740417480469, -0.03163909912109375, -0.024110794067382812, -0.016582489013671875, -0.009054183959960938, -0.00152587890625, 0.0060024261474609375, 0.013530731201171875, 0.021059036254882812, 0.02858734130859375, 0.03611564636230469, 0.043643951416015625, 0.05117225646972656, 0.0587005615234375, 0.06622886657714844, 0.07375717163085938, 0.08128547668457031, 0.08881378173828125, 0.09634208679199219, 0.10387039184570312, 0.11139869689941406, 0.118927001953125, 0.12645530700683594, 0.13398361206054688, 0.1415119171142578, 0.14904022216796875, 0.1565685272216797, 0.16409683227539062, 0.17162513732910156, 0.1791534423828125, 0.18668174743652344, 0.19421005249023438, 0.2017383575439453, 0.20926666259765625, 0.2167949676513672, 0.22432327270507812, 0.23185157775878906, 0.2393798828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 7.0, 23.0, 23.0, 24.0, 41.0, 49.0, 54.0, 86.0, 104.0, 155.0, 197.0, 263.0, 362.0, 539.0, 977.0, 2155.0, 7831.0, 110065.0, 869469.0, 46473.0, 5273.0, 1727.0, 804.0, 491.0, 362.0, 232.0, 199.0, 128.0, 106.0, 82.0, 48.0, 40.0, 46.0, 19.0, 23.0, 14.0, 5.0, 8.0, 5.0, 8.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.61962890625, -0.5992279052734375, -0.578826904296875, -0.5584259033203125, -0.53802490234375, -0.5176239013671875, -0.497222900390625, -0.4768218994140625, -0.4564208984375, -0.4360198974609375, -0.415618896484375, -0.3952178955078125, -0.37481689453125, -0.3544158935546875, -0.334014892578125, -0.3136138916015625, -0.293212890625, -0.2728118896484375, -0.252410888671875, -0.2320098876953125, -0.21160888671875, -0.1912078857421875, -0.170806884765625, -0.1504058837890625, -0.1300048828125, -0.1096038818359375, -0.089202880859375, -0.0688018798828125, -0.04840087890625, -0.0279998779296875, -0.007598876953125, 0.0128021240234375, 0.033203125, 0.0536041259765625, 0.074005126953125, 0.0944061279296875, 0.11480712890625, 0.1352081298828125, 0.155609130859375, 0.1760101318359375, 0.1964111328125, 0.2168121337890625, 0.237213134765625, 0.2576141357421875, 0.27801513671875, 0.2984161376953125, 0.318817138671875, 0.3392181396484375, 0.359619140625, 0.3800201416015625, 0.400421142578125, 0.4208221435546875, 0.44122314453125, 0.4616241455078125, 0.482025146484375, 0.5024261474609375, 0.5228271484375, 0.5432281494140625, 0.563629150390625, 0.5840301513671875, 0.60443115234375, 0.6248321533203125, 0.645233154296875, 0.6656341552734375, 0.68603515625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 5.0, 11.0, 16.0, 20.0, 29.0, 27.0, 35.0, 42.0, 48.0, 47.0, 56.0, 51.0, 66.0, 58.0, 58.0, 53.0, 62.0, 47.0, 39.0, 36.0, 27.0, 32.0, 31.0, 15.0, 21.0, 13.0, 10.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.912109375, -0.8802490234375, -0.848388671875, -0.8165283203125, -0.78466796875, -0.7528076171875, -0.720947265625, -0.6890869140625, -0.6572265625, -0.6253662109375, -0.593505859375, -0.5616455078125, -0.52978515625, -0.4979248046875, -0.466064453125, -0.4342041015625, -0.40234375, -0.3704833984375, -0.338623046875, -0.3067626953125, -0.27490234375, -0.2430419921875, -0.211181640625, -0.1793212890625, -0.1474609375, -0.1156005859375, -0.083740234375, -0.0518798828125, -0.02001953125, 0.0118408203125, 0.043701171875, 0.0755615234375, 0.107421875, 0.1392822265625, 0.171142578125, 0.2030029296875, 0.23486328125, 0.2667236328125, 0.298583984375, 0.3304443359375, 0.3623046875, 0.3941650390625, 0.426025390625, 0.4578857421875, 0.48974609375, 0.5216064453125, 0.553466796875, 0.5853271484375, 0.6171875, 0.6490478515625, 0.680908203125, 0.7127685546875, 0.74462890625, 0.7764892578125, 0.808349609375, 0.8402099609375, 0.8720703125, 0.9039306640625, 0.935791015625, 0.9676513671875, 0.99951171875, 1.0313720703125, 1.063232421875, 1.0950927734375, 1.126953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 12.0, 9.0, 20.0, 29.0, 31.0, 50.0, 68.0, 128.0, 208.0, 384.0, 794.0, 2284.0, 9180.0, 87153.0, 851462.0, 83802.0, 8998.0, 2164.0, 813.0, 352.0, 214.0, 106.0, 71.0, 59.0, 49.0, 29.0, 20.0, 8.0, 12.0, 3.0, 9.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1767578125, -0.17131805419921875, -0.1658782958984375, -0.16043853759765625, -0.154998779296875, -0.14955902099609375, -0.1441192626953125, -0.13867950439453125, -0.13323974609375, -0.12779998779296875, -0.1223602294921875, -0.11692047119140625, -0.111480712890625, -0.10604095458984375, -0.1006011962890625, -0.09516143798828125, -0.0897216796875, -0.08428192138671875, -0.0788421630859375, -0.07340240478515625, -0.067962646484375, -0.06252288818359375, -0.0570831298828125, -0.05164337158203125, -0.04620361328125, -0.04076385498046875, -0.0353240966796875, -0.02988433837890625, -0.024444580078125, -0.01900482177734375, -0.0135650634765625, -0.00812530517578125, -0.002685546875, 0.00275421142578125, 0.0081939697265625, 0.01363372802734375, 0.019073486328125, 0.02451324462890625, 0.0299530029296875, 0.03539276123046875, 0.04083251953125, 0.04627227783203125, 0.0517120361328125, 0.05715179443359375, 0.062591552734375, 0.06803131103515625, 0.0734710693359375, 0.07891082763671875, 0.0843505859375, 0.08979034423828125, 0.0952301025390625, 0.10066986083984375, 0.106109619140625, 0.11154937744140625, 0.1169891357421875, 0.12242889404296875, 0.12786865234375, 0.13330841064453125, 0.1387481689453125, 0.14418792724609375, 0.149627685546875, 0.15506744384765625, 0.1605072021484375, 0.16594696044921875, 0.17138671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 11.0, 17.0, 8.0, 14.0, 22.0, 22.0, 19.0, 28.0, 39.0, 37.0, 80.0, 104.0, 114.0, 105.0, 82.0, 76.0, 37.0, 28.0, 30.0, 23.0, 16.0, 15.0, 13.0, 13.0, 2.0, 5.0, 7.0, 3.0, 3.0, 0.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.455183029174805e-05, -6.225146353244781e-05, -5.995109677314758e-05, -5.765073001384735e-05, -5.535036325454712e-05, -5.304999649524689e-05, -5.0749629735946655e-05, -4.844926297664642e-05, -4.614889621734619e-05, -4.384852945804596e-05, -4.154816269874573e-05, -3.9247795939445496e-05, -3.6947429180145264e-05, -3.464706242084503e-05, -3.23466956615448e-05, -3.0046328902244568e-05, -2.7745962142944336e-05, -2.5445595383644104e-05, -2.3145228624343872e-05, -2.084486186504364e-05, -1.8544495105743408e-05, -1.6244128346443176e-05, -1.3943761587142944e-05, -1.1643394827842712e-05, -9.34302806854248e-06, -7.0426613092422485e-06, -4.742294549942017e-06, -2.4419277906417847e-06, -1.4156103134155273e-07, 2.158805727958679e-06, 4.459172487258911e-06, 6.759539246559143e-06, 9.059906005859375e-06, 1.1360272765159607e-05, 1.3660639524459839e-05, 1.596100628376007e-05, 1.8261373043060303e-05, 2.0561739802360535e-05, 2.2862106561660767e-05, 2.5162473320961e-05, 2.746284008026123e-05, 2.9763206839561462e-05, 3.2063573598861694e-05, 3.4363940358161926e-05, 3.666430711746216e-05, 3.896467387676239e-05, 4.126504063606262e-05, 4.3565407395362854e-05, 4.5865774154663086e-05, 4.816614091396332e-05, 5.046650767326355e-05, 5.276687443256378e-05, 5.5067241191864014e-05, 5.7367607951164246e-05, 5.966797471046448e-05, 6.196834146976471e-05, 6.426870822906494e-05, 6.656907498836517e-05, 6.88694417476654e-05, 7.116980850696564e-05, 7.347017526626587e-05, 7.57705420255661e-05, 7.807090878486633e-05, 8.037127554416656e-05, 8.26716423034668e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 10.0, 1.0, 8.0, 9.0, 14.0, 18.0, 28.0, 32.0, 50.0, 67.0, 103.0, 141.0, 236.0, 409.0, 960.0, 2467.0, 9103.0, 70661.0, 861162.0, 87714.0, 10497.0, 2699.0, 996.0, 439.0, 255.0, 134.0, 112.0, 70.0, 42.0, 33.0, 20.0, 12.0, 12.0, 7.0, 7.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18658828735351562, -0.18067169189453125, -0.17475509643554688, -0.1688385009765625, -0.16292190551757812, -0.15700531005859375, -0.15108871459960938, -0.145172119140625, -0.13925552368164062, -0.13333892822265625, -0.12742233276367188, -0.1215057373046875, -0.11558914184570312, -0.10967254638671875, -0.10375595092773438, -0.09783935546875, -0.09192276000976562, -0.08600616455078125, -0.08008956909179688, -0.0741729736328125, -0.06825637817382812, -0.06233978271484375, -0.056423187255859375, -0.050506591796875, -0.044589996337890625, -0.03867340087890625, -0.032756805419921875, -0.0268402099609375, -0.020923614501953125, -0.01500701904296875, -0.009090423583984375, -0.003173828125, 0.002742767333984375, 0.00865936279296875, 0.014575958251953125, 0.0204925537109375, 0.026409149169921875, 0.03232574462890625, 0.038242340087890625, 0.044158935546875, 0.050075531005859375, 0.05599212646484375, 0.061908721923828125, 0.0678253173828125, 0.07374191284179688, 0.07965850830078125, 0.08557510375976562, 0.09149169921875, 0.09740829467773438, 0.10332489013671875, 0.10924148559570312, 0.1151580810546875, 0.12107467651367188, 0.12699127197265625, 0.13290786743164062, 0.138824462890625, 0.14474105834960938, 0.15065765380859375, 0.15657424926757812, 0.1624908447265625, 0.16840744018554688, 0.17432403564453125, 0.18024063110351562, 0.1861572265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 3.0, 8.0, 12.0, 8.0, 15.0, 19.0, 22.0, 32.0, 42.0, 55.0, 83.0, 73.0, 75.0, 101.0, 96.0, 64.0, 62.0, 43.0, 39.0, 32.0, 23.0, 26.0, 12.0, 13.0, 8.0, 2.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1324462890625, -0.12774085998535156, -0.12303543090820312, -0.11833000183105469, -0.11362457275390625, -0.10891914367675781, -0.10421371459960938, -0.09950828552246094, -0.0948028564453125, -0.09009742736816406, -0.08539199829101562, -0.08068656921386719, -0.07598114013671875, -0.07127571105957031, -0.06657028198242188, -0.06186485290527344, -0.057159423828125, -0.05245399475097656, -0.047748565673828125, -0.04304313659667969, -0.03833770751953125, -0.03363227844238281, -0.028926849365234375, -0.024221420288085938, -0.0195159912109375, -0.014810562133789062, -0.010105133056640625, -0.0053997039794921875, -0.00069427490234375, 0.0040111541748046875, 0.008716583251953125, 0.013422012329101562, 0.01812744140625, 0.022832870483398438, 0.027538299560546875, 0.03224372863769531, 0.03694915771484375, 0.04165458679199219, 0.046360015869140625, 0.05106544494628906, 0.0557708740234375, 0.06047630310058594, 0.06518173217773438, 0.06988716125488281, 0.07459259033203125, 0.07929801940917969, 0.08400344848632812, 0.08870887756347656, 0.093414306640625, 0.09811973571777344, 0.10282516479492188, 0.10753059387207031, 0.11223602294921875, 0.11694145202636719, 0.12164688110351562, 0.12635231018066406, 0.1310577392578125, 0.13576316833496094, 0.14046859741210938, 0.1451740264892578, 0.14987945556640625, 0.1545848846435547, 0.15929031372070312, 0.16399574279785156, 0.168701171875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 13.0, 28.0, 146.0, 511.0, 201.0, 45.0, 21.0, 14.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8624258041381836, -2.634716510772705, -2.4070072174072266, -2.179297924041748, -1.9515886306762695, -1.723879337310791, -1.4961700439453125, -1.268460750579834, -1.0407514572143555, -0.813042163848877, -0.5853328704833984, -0.3576235771179199, -0.1299142837524414, 0.09779500961303711, 0.3255043029785156, 0.5532135963439941, 0.7809228897094727, 1.0086321830749512, 1.2363414764404297, 1.4640507698059082, 1.6917600631713867, 1.9194693565368652, 2.1471786499023438, 2.3748879432678223, 2.602597236633301, 2.8303065299987793, 3.058015823364258, 3.2857251167297363, 3.513434410095215, 3.7411437034606934, 3.968852996826172, 4.19656229019165, 4.424271583557129, 4.651980876922607, 4.879690170288086, 5.1073994636535645, 5.335108757019043, 5.5628180503845215, 5.79052734375, 6.0182366371154785, 6.245945930480957, 6.4736552238464355, 6.701364517211914, 6.929073810577393, 7.156783103942871, 7.38449239730835, 7.612201690673828, 7.839910984039307, 8.067620277404785, 8.295330047607422, 8.523038864135742, 8.750747680664062, 8.9784574508667, 9.206167221069336, 9.433876037597656, 9.661584854125977, 9.889294624328613, 10.11700439453125, 10.34471321105957, 10.57242202758789, 10.800131797790527, 11.027841567993164, 11.255550384521484, 11.483259201049805, 11.710968971252441]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 3.0, 8.0, 11.0, 10.0, 12.0, 25.0, 16.0, 28.0, 25.0, 33.0, 36.0, 39.0, 44.0, 37.0, 53.0, 82.0, 82.0, 70.0, 60.0, 51.0, 45.0, 40.0, 29.0, 24.0, 16.0, 11.0, 20.0, 21.0, 20.0, 12.0, 7.0, 8.0, 7.0, 4.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.527020454406738, -4.412191390991211, -4.297362327575684, -4.182532787322998, -4.067703723907471, -3.9528746604919434, -3.838045597076416, -3.7232162952423096, -3.6083872318267822, -3.493558168411255, -3.3787288665771484, -3.263899803161621, -3.1490705013275146, -3.0342414379119873, -2.919412136077881, -2.8045830726623535, -2.689754009246826, -2.574924945831299, -2.4600956439971924, -2.345266580581665, -2.2304372787475586, -2.1156082153320312, -2.000779151916504, -1.8859498500823975, -1.771120548248291, -1.6562913656234741, -1.5414621829986572, -1.4266331195831299, -1.311803936958313, -1.196974754333496, -1.0821455717086792, -0.9673164486885071, -0.852487325668335, -0.7376581430435181, -0.622829020023346, -0.507999837398529, -0.39317068457603455, -0.27834153175354004, -0.16351234912872314, -0.048683226108551025, 0.06614595651626587, 0.18097510933876038, 0.2958042621612549, 0.4106334447860718, 0.5254626274108887, 0.6402917504310608, 0.7551209330558777, 0.8699500560760498, 0.9847792387008667, 1.0996084213256836, 1.2144376039505005, 1.3292667865753174, 1.4440958499908447, 1.5589250326156616, 1.6737542152404785, 1.7885832786560059, 1.9034125804901123, 2.0182416439056396, 2.133070945739746, 2.2479000091552734, 2.36272931098938, 2.4775583744049072, 2.5923876762390137, 2.707216739654541, 2.8220458030700684]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 7.0, 13.0, 14.0, 24.0, 39.0, 42.0, 80.0, 101.0, 176.0, 338.0, 637.0, 1406.0, 3165.0, 8699.0, 30127.0, 190516.0, 1707763.0, 1949170.0, 246779.0, 37120.0, 10003.0, 4015.0, 1908.0, 1012.0, 507.0, 262.0, 121.0, 71.0, 48.0, 35.0, 19.0, 19.0, 7.0, 6.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2349853515625, -0.22864341735839844, -0.22230148315429688, -0.2159595489501953, -0.20961761474609375, -0.2032756805419922, -0.19693374633789062, -0.19059181213378906, -0.1842498779296875, -0.17790794372558594, -0.17156600952148438, -0.1652240753173828, -0.15888214111328125, -0.1525402069091797, -0.14619827270507812, -0.13985633850097656, -0.133514404296875, -0.12717247009277344, -0.12083053588867188, -0.11448860168457031, -0.10814666748046875, -0.10180473327636719, -0.09546279907226562, -0.08912086486816406, -0.0827789306640625, -0.07643699645996094, -0.07009506225585938, -0.06375312805175781, -0.05741119384765625, -0.05106925964355469, -0.044727325439453125, -0.03838539123535156, -0.03204345703125, -0.025701522827148438, -0.019359588623046875, -0.013017654418945312, -0.00667572021484375, -0.0003337860107421875, 0.006008148193359375, 0.012350082397460938, 0.0186920166015625, 0.025033950805664062, 0.031375885009765625, 0.03771781921386719, 0.04405975341796875, 0.05040168762207031, 0.056743621826171875, 0.06308555603027344, 0.069427490234375, 0.07576942443847656, 0.08211135864257812, 0.08845329284667969, 0.09479522705078125, 0.10113716125488281, 0.10747909545898438, 0.11382102966308594, 0.1201629638671875, 0.12650489807128906, 0.13284683227539062, 0.1391887664794922, 0.14553070068359375, 0.1518726348876953, 0.15821456909179688, 0.16455650329589844, 0.1708984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 6.0, 8.0, 14.0, 24.0, 38.0, 54.0, 70.0, 79.0, 95.0, 95.0, 121.0, 73.0, 102.0, 83.0, 49.0, 30.0, 30.0, 18.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5141181945800781, -0.5018692016601562, -0.4896202087402344, -0.4773712158203125, -0.4651222229003906, -0.45287322998046875, -0.4406242370605469, -0.428375244140625, -0.4161262512207031, -0.40387725830078125, -0.3916282653808594, -0.3793792724609375, -0.3671302795410156, -0.35488128662109375, -0.3426322937011719, -0.33038330078125, -0.3181343078613281, -0.30588531494140625, -0.2936363220214844, -0.2813873291015625, -0.2691383361816406, -0.25688934326171875, -0.24464035034179688, -0.232391357421875, -0.22014236450195312, -0.20789337158203125, -0.19564437866210938, -0.1833953857421875, -0.17114639282226562, -0.15889739990234375, -0.14664840698242188, -0.1343994140625, -0.12215042114257812, -0.10990142822265625, -0.09765243530273438, -0.0854034423828125, -0.07315444946289062, -0.06090545654296875, -0.048656463623046875, -0.036407470703125, -0.024158477783203125, -0.01190948486328125, 0.000339508056640625, 0.0125885009765625, 0.024837493896484375, 0.03708648681640625, 0.049335479736328125, 0.06158447265625, 0.07383346557617188, 0.08608245849609375, 0.09833145141601562, 0.1105804443359375, 0.12282943725585938, 0.13507843017578125, 0.14732742309570312, 0.159576416015625, 0.17182540893554688, 0.18407440185546875, 0.19632339477539062, 0.2085723876953125, 0.22082138061523438, 0.23307037353515625, 0.24531936645507812, 0.257568359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 10.0, 20.0, 39.0, 74.0, 138.0, 257.0, 527.0, 954.0, 2175.0, 6902.0, 34552.0, 780462.0, 3288545.0, 67196.0, 8610.0, 2145.0, 753.0, 397.0, 209.0, 110.0, 68.0, 44.0, 24.0, 12.0, 15.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.3714790344238281, -0.35916900634765625, -0.3468589782714844, -0.3345489501953125, -0.3222389221191406, -0.30992889404296875, -0.2976188659667969, -0.285308837890625, -0.2729988098144531, -0.26068878173828125, -0.24837875366210938, -0.2360687255859375, -0.22375869750976562, -0.21144866943359375, -0.19913864135742188, -0.18682861328125, -0.17451858520507812, -0.16220855712890625, -0.14989852905273438, -0.1375885009765625, -0.12527847290039062, -0.11296844482421875, -0.10065841674804688, -0.088348388671875, -0.07603836059570312, -0.06372833251953125, -0.051418304443359375, -0.0391082763671875, -0.026798248291015625, -0.01448822021484375, -0.002178192138671875, 0.0101318359375, 0.022441864013671875, 0.03475189208984375, 0.047061920166015625, 0.0593719482421875, 0.07168197631835938, 0.08399200439453125, 0.09630203247070312, 0.108612060546875, 0.12092208862304688, 0.13323211669921875, 0.14554214477539062, 0.1578521728515625, 0.17016220092773438, 0.18247222900390625, 0.19478225708007812, 0.20709228515625, 0.21940231323242188, 0.23171234130859375, 0.24402236938476562, 0.2563323974609375, 0.2686424255371094, 0.28095245361328125, 0.2932624816894531, 0.305572509765625, 0.3178825378417969, 0.33019256591796875, 0.3425025939941406, 0.3548126220703125, 0.3671226501464844, 0.37943267822265625, 0.3917427062988281, 0.404052734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 10.0, 19.0, 29.0, 45.0, 76.0, 170.0, 545.0, 1361.0, 1203.0, 376.0, 113.0, 50.0, 26.0, 10.0, 16.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5540847778320312, -0.5334625244140625, -0.5128402709960938, -0.492218017578125, -0.47159576416015625, -0.4509735107421875, -0.43035125732421875, -0.40972900390625, -0.38910675048828125, -0.3684844970703125, -0.34786224365234375, -0.327239990234375, -0.30661773681640625, -0.2859954833984375, -0.26537322998046875, -0.2447509765625, -0.22412872314453125, -0.2035064697265625, -0.18288421630859375, -0.162261962890625, -0.14163970947265625, -0.1210174560546875, -0.10039520263671875, -0.07977294921875, -0.05915069580078125, -0.0385284423828125, -0.01790618896484375, 0.002716064453125, 0.02333831787109375, 0.0439605712890625, 0.06458282470703125, 0.085205078125, 0.10582733154296875, 0.1264495849609375, 0.14707183837890625, 0.167694091796875, 0.18831634521484375, 0.2089385986328125, 0.22956085205078125, 0.25018310546875, 0.27080535888671875, 0.2914276123046875, 0.31204986572265625, 0.332672119140625, 0.35329437255859375, 0.3739166259765625, 0.39453887939453125, 0.4151611328125, 0.43578338623046875, 0.4564056396484375, 0.47702789306640625, 0.497650146484375, 0.5182723999023438, 0.5388946533203125, 0.5595169067382812, 0.58013916015625, 0.6007614135742188, 0.6213836669921875, 0.6420059204101562, 0.662628173828125, 0.6832504272460938, 0.7038726806640625, 0.7244949340820312, 0.7451171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 33.0, 119.0, 372.0, 340.0, 89.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.320489883422852, -6.140018939971924, -5.959547996520996, -5.779077053070068, -5.598606109619141, -5.418135166168213, -5.237664222717285, -5.057193279266357, -4.87672233581543, -4.696251392364502, -4.515780448913574, -4.3353095054626465, -4.154838562011719, -3.974367618560791, -3.7938966751098633, -3.6134257316589355, -3.4329545497894287, -3.252483606338501, -3.0720126628875732, -2.8915417194366455, -2.7110707759857178, -2.53059983253479, -2.350128650665283, -2.1696577072143555, -1.9891868829727173, -1.8087159395217896, -1.6282449960708618, -1.4477739334106445, -1.2673029899597168, -1.086832046508789, -0.9063611030578613, -0.7258901596069336, -0.5454192161560059, -0.3649482727050781, -0.184477299451828, -0.004006326198577881, 0.17646461725234985, 0.3569355607032776, 0.5374065637588501, 0.7178775072097778, 0.8983484506607056, 1.0788193941116333, 1.259290337562561, 1.4397614002227783, 1.620232343673706, 1.8007032871246338, 1.9811742305755615, 2.1616451740264893, 2.342116117477417, 2.5225870609283447, 2.7030580043792725, 2.8835289478302, 3.063999891281128, 3.2444708347320557, 3.4249420166015625, 3.6054129600524902, 3.785883903503418, 3.9663548469543457, 4.146825790405273, 4.327296733856201, 4.507767677307129, 4.688238620758057, 4.868709564208984, 5.049180507659912, 5.22965145111084]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 8.0, 15.0, 9.0, 22.0, 20.0, 29.0, 36.0, 54.0, 62.0, 76.0, 82.0, 84.0, 80.0, 76.0, 77.0, 61.0, 54.0, 35.0, 30.0, 23.0, 19.0, 13.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.850261926651001, -1.7613246440887451, -1.6723873615264893, -1.5834500789642334, -1.4945127964019775, -1.4055755138397217, -1.3166381120681763, -1.2277008295059204, -1.1387635469436646, -1.0498262643814087, -0.9608889818191528, -0.8719516396522522, -0.7830143570899963, -0.6940770745277405, -0.6051397323608398, -0.516202449798584, -0.4272651672363281, -0.33832788467407227, -0.24939057230949402, -0.16045325994491577, -0.07151597738265991, 0.017421305179595947, 0.10635864734649658, 0.19529592990875244, 0.2842332124710083, 0.37317049503326416, 0.4621078073978424, 0.5510451197624207, 0.6399824023246765, 0.7289196848869324, 0.817857027053833, 0.9067943096160889, 0.9957313537597656, 1.0846686363220215, 1.1736059188842773, 1.2625432014465332, 1.351480484008789, 1.440417766571045, 1.5293551683425903, 1.6182924509048462, 1.707229733467102, 1.796167016029358, 1.8851042985916138, 1.9740417003631592, 2.062978982925415, 2.151916265487671, 2.2408535480499268, 2.3297908306121826, 2.4187281131744385, 2.5076653957366943, 2.59660267829895, 2.685539960861206, 2.774477243423462, 2.8634145259857178, 2.9523520469665527, 3.0412893295288086, 3.1302266120910645, 3.2191638946533203, 3.308101177215576, 3.397038459777832, 3.485975742340088, 3.5749130249023438, 3.6638503074645996, 3.7527875900268555, 3.8417248725891113]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 6.0, 2.0, 7.0, 7.0, 13.0, 10.0, 31.0, 27.0, 38.0, 67.0, 105.0, 166.0, 291.0, 501.0, 913.0, 1961.0, 4644.0, 12719.0, 39375.0, 139561.0, 403020.0, 310379.0, 92276.0, 26749.0, 8908.0, 3401.0, 1545.0, 740.0, 413.0, 243.0, 130.0, 89.0, 55.0, 40.0, 32.0, 20.0, 20.0, 13.0, 11.0, 11.0, 2.0, 2.0, 5.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.236328125, -0.22866439819335938, -0.22100067138671875, -0.21333694458007812, -0.2056732177734375, -0.19800949096679688, -0.19034576416015625, -0.18268203735351562, -0.175018310546875, -0.16735458374023438, -0.15969085693359375, -0.15202713012695312, -0.1443634033203125, -0.13669967651367188, -0.12903594970703125, -0.12137222290039062, -0.11370849609375, -0.10604476928710938, -0.09838104248046875, -0.09071731567382812, -0.0830535888671875, -0.07538986206054688, -0.06772613525390625, -0.060062408447265625, -0.052398681640625, -0.044734954833984375, -0.03707122802734375, -0.029407501220703125, -0.0217437744140625, -0.014080047607421875, -0.00641632080078125, 0.001247406005859375, 0.0089111328125, 0.016574859619140625, 0.02423858642578125, 0.031902313232421875, 0.0395660400390625, 0.047229766845703125, 0.05489349365234375, 0.06255722045898438, 0.070220947265625, 0.07788467407226562, 0.08554840087890625, 0.09321212768554688, 0.1008758544921875, 0.10853958129882812, 0.11620330810546875, 0.12386703491210938, 0.13153076171875, 0.13919448852539062, 0.14685821533203125, 0.15452194213867188, 0.1621856689453125, 0.16984939575195312, 0.17751312255859375, 0.18517684936523438, 0.192840576171875, 0.20050430297851562, 0.20816802978515625, 0.21583175659179688, 0.2234954833984375, 0.23115921020507812, 0.23882293701171875, 0.24648666381835938, 0.254150390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 5.0, 6.0, 3.0, 14.0, 10.0, 22.0, 23.0, 35.0, 44.0, 40.0, 50.0, 62.0, 78.0, 64.0, 63.0, 74.0, 62.0, 73.0, 54.0, 34.0, 53.0, 33.0, 28.0, 17.0, 17.0, 11.0, 8.0, 6.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2406005859375, -0.2329540252685547, -0.22530746459960938, -0.21766090393066406, -0.21001434326171875, -0.20236778259277344, -0.19472122192382812, -0.1870746612548828, -0.1794281005859375, -0.1717815399169922, -0.16413497924804688, -0.15648841857910156, -0.14884185791015625, -0.14119529724121094, -0.13354873657226562, -0.1259021759033203, -0.118255615234375, -0.11060905456542969, -0.10296249389648438, -0.09531593322753906, -0.08766937255859375, -0.08002281188964844, -0.07237625122070312, -0.06472969055175781, -0.0570831298828125, -0.04943656921386719, -0.041790008544921875, -0.03414344787597656, -0.02649688720703125, -0.018850326538085938, -0.011203765869140625, -0.0035572052001953125, 0.00408935546875, 0.011735916137695312, 0.019382476806640625, 0.027029037475585938, 0.03467559814453125, 0.04232215881347656, 0.049968719482421875, 0.05761528015136719, 0.0652618408203125, 0.07290840148925781, 0.08055496215820312, 0.08820152282714844, 0.09584808349609375, 0.10349464416503906, 0.11114120483398438, 0.11878776550292969, 0.126434326171875, 0.1340808868408203, 0.14172744750976562, 0.14937400817871094, 0.15702056884765625, 0.16466712951660156, 0.17231369018554688, 0.1799602508544922, 0.1876068115234375, 0.1952533721923828, 0.20289993286132812, 0.21054649353027344, 0.21819305419921875, 0.22583961486816406, 0.23348617553710938, 0.2411327362060547, 0.248779296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 9.0, 8.0, 13.0, 24.0, 22.0, 42.0, 55.0, 81.0, 117.0, 187.0, 279.0, 404.0, 693.0, 1377.0, 3635.0, 28068.0, 827793.0, 172358.0, 8675.0, 2134.0, 1015.0, 521.0, 341.0, 220.0, 147.0, 119.0, 69.0, 44.0, 28.0, 17.0, 15.0, 14.0, 11.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7029647827148438, -0.6808319091796875, -0.6586990356445312, -0.636566162109375, -0.6144332885742188, -0.5923004150390625, -0.5701675415039062, -0.54803466796875, -0.5259017944335938, -0.5037689208984375, -0.48163604736328125, -0.459503173828125, -0.43737030029296875, -0.4152374267578125, -0.39310455322265625, -0.3709716796875, -0.34883880615234375, -0.3267059326171875, -0.30457305908203125, -0.282440185546875, -0.26030731201171875, -0.2381744384765625, -0.21604156494140625, -0.19390869140625, -0.17177581787109375, -0.1496429443359375, -0.12751007080078125, -0.105377197265625, -0.08324432373046875, -0.0611114501953125, -0.03897857666015625, -0.016845703125, 0.00528717041015625, 0.0274200439453125, 0.04955291748046875, 0.071685791015625, 0.09381866455078125, 0.1159515380859375, 0.13808441162109375, 0.16021728515625, 0.18235015869140625, 0.2044830322265625, 0.22661590576171875, 0.248748779296875, 0.27088165283203125, 0.2930145263671875, 0.31514739990234375, 0.3372802734375, 0.35941314697265625, 0.3815460205078125, 0.40367889404296875, 0.425811767578125, 0.44794464111328125, 0.4700775146484375, 0.49221038818359375, 0.51434326171875, 0.5364761352539062, 0.5586090087890625, 0.5807418823242188, 0.602874755859375, 0.6250076293945312, 0.6471405029296875, 0.6692733764648438, 0.69140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 5.0, 7.0, 12.0, 14.0, 18.0, 15.0, 19.0, 19.0, 30.0, 19.0, 45.0, 38.0, 36.0, 33.0, 48.0, 48.0, 50.0, 54.0, 44.0, 55.0, 47.0, 39.0, 42.0, 38.0, 34.0, 22.0, 28.0, 22.0, 18.0, 16.0, 10.0, 16.0, 9.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6630859375, -0.6439285278320312, -0.6247711181640625, -0.6056137084960938, -0.586456298828125, -0.5672988891601562, -0.5481414794921875, -0.5289840698242188, -0.50982666015625, -0.49066925048828125, -0.4715118408203125, -0.45235443115234375, -0.433197021484375, -0.41403961181640625, -0.3948822021484375, -0.37572479248046875, -0.3565673828125, -0.33740997314453125, -0.3182525634765625, -0.29909515380859375, -0.279937744140625, -0.26078033447265625, -0.2416229248046875, -0.22246551513671875, -0.20330810546875, -0.18415069580078125, -0.1649932861328125, -0.14583587646484375, -0.126678466796875, -0.10752105712890625, -0.0883636474609375, -0.06920623779296875, -0.050048828125, -0.03089141845703125, -0.0117340087890625, 0.00742340087890625, 0.026580810546875, 0.04573822021484375, 0.0648956298828125, 0.08405303955078125, 0.10321044921875, 0.12236785888671875, 0.1415252685546875, 0.16068267822265625, 0.179840087890625, 0.19899749755859375, 0.2181549072265625, 0.23731231689453125, 0.2564697265625, 0.27562713623046875, 0.2947845458984375, 0.31394195556640625, 0.333099365234375, 0.35225677490234375, 0.3714141845703125, 0.39057159423828125, 0.40972900390625, 0.42888641357421875, 0.4480438232421875, 0.46720123291015625, 0.486358642578125, 0.5055160522460938, 0.5246734619140625, 0.5438308715820312, 0.56298828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 12.0, 9.0, 7.0, 23.0, 18.0, 22.0, 40.0, 65.0, 83.0, 162.0, 330.0, 885.0, 3623.0, 40757.0, 917753.0, 77554.0, 5220.0, 1115.0, 392.0, 167.0, 91.0, 51.0, 34.0, 26.0, 24.0, 15.0, 15.0, 11.0, 4.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2113037109375, -0.2036457061767578, -0.19598770141601562, -0.18832969665527344, -0.18067169189453125, -0.17301368713378906, -0.16535568237304688, -0.1576976776123047, -0.1500396728515625, -0.1423816680908203, -0.13472366333007812, -0.12706565856933594, -0.11940765380859375, -0.11174964904785156, -0.10409164428710938, -0.09643363952636719, -0.088775634765625, -0.08111763000488281, -0.07345962524414062, -0.06580162048339844, -0.05814361572265625, -0.05048561096191406, -0.042827606201171875, -0.03516960144042969, -0.0275115966796875, -0.019853591918945312, -0.012195587158203125, -0.0045375823974609375, 0.00312042236328125, 0.010778427124023438, 0.018436431884765625, 0.026094436645507812, 0.03375244140625, 0.04141044616699219, 0.049068450927734375, 0.05672645568847656, 0.06438446044921875, 0.07204246520996094, 0.07970046997070312, 0.08735847473144531, 0.0950164794921875, 0.10267448425292969, 0.11033248901367188, 0.11799049377441406, 0.12564849853515625, 0.13330650329589844, 0.14096450805664062, 0.1486225128173828, 0.156280517578125, 0.1639385223388672, 0.17159652709960938, 0.17925453186035156, 0.18691253662109375, 0.19457054138183594, 0.20222854614257812, 0.2098865509033203, 0.2175445556640625, 0.2252025604248047, 0.23286056518554688, 0.24051856994628906, 0.24817657470703125, 0.25583457946777344, 0.2634925842285156, 0.2711505889892578, 0.27880859375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 14.0, 16.0, 27.0, 35.0, 58.0, 115.0, 182.0, 176.0, 126.0, 54.0, 40.0, 30.0, 23.0, 16.0, 16.0, 5.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011849403381347656, -0.0001147901639342308, -0.00011108629405498505, -0.00010738242417573929, -0.00010367855429649353, -9.997468441724777e-05, -9.627081453800201e-05, -9.256694465875626e-05, -8.88630747795105e-05, -8.515920490026474e-05, -8.145533502101898e-05, -7.775146514177322e-05, -7.404759526252747e-05, -7.034372538328171e-05, -6.663985550403595e-05, -6.293598562479019e-05, -5.9232115745544434e-05, -5.5528245866298676e-05, -5.182437598705292e-05, -4.812050610780716e-05, -4.44166362285614e-05, -4.071276634931564e-05, -3.7008896470069885e-05, -3.330502659082413e-05, -2.960115671157837e-05, -2.589728683233261e-05, -2.2193416953086853e-05, -1.8489547073841095e-05, -1.4785677194595337e-05, -1.1081807315349579e-05, -7.377937436103821e-06, -3.6740675568580627e-06, 2.9802322387695312e-08, 3.7336722016334534e-06, 7.4375420808792114e-06, 1.114141196012497e-05, 1.4845281839370728e-05, 1.8549151718616486e-05, 2.2253021597862244e-05, 2.5956891477108002e-05, 2.966076135635376e-05, 3.336463123559952e-05, 3.7068501114845276e-05, 4.0772370994091034e-05, 4.447624087333679e-05, 4.818011075258255e-05, 5.188398063182831e-05, 5.5587850511074066e-05, 5.9291720390319824e-05, 6.299559026956558e-05, 6.669946014881134e-05, 7.04033300280571e-05, 7.410719990730286e-05, 7.781106978654861e-05, 8.151493966579437e-05, 8.521880954504013e-05, 8.892267942428589e-05, 9.262654930353165e-05, 9.63304191827774e-05, 0.00010003428906202316, 0.00010373815894126892, 0.00010744202882051468, 0.00011114589869976044, 0.0001148497685790062, 0.00011855363845825195]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 1.0, 7.0, 9.0, 13.0, 15.0, 31.0, 54.0, 66.0, 132.0, 209.0, 461.0, 1181.0, 3986.0, 27238.0, 793351.0, 206421.0, 11372.0, 2376.0, 799.0, 380.0, 183.0, 95.0, 61.0, 41.0, 16.0, 16.0, 8.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16910743713378906, -0.16255569458007812, -0.1560039520263672, -0.14945220947265625, -0.1429004669189453, -0.13634872436523438, -0.12979698181152344, -0.1232452392578125, -0.11669349670410156, -0.11014175415039062, -0.10359001159667969, -0.09703826904296875, -0.09048652648925781, -0.08393478393554688, -0.07738304138183594, -0.070831298828125, -0.06427955627441406, -0.057727813720703125, -0.05117607116699219, -0.04462432861328125, -0.03807258605957031, -0.031520843505859375, -0.024969100952148438, -0.0184173583984375, -0.011865615844726562, -0.005313873291015625, 0.0012378692626953125, 0.00778961181640625, 0.014341354370117188, 0.020893096923828125, 0.027444839477539062, 0.03399658203125, 0.04054832458496094, 0.047100067138671875, 0.05365180969238281, 0.06020355224609375, 0.06675529479980469, 0.07330703735351562, 0.07985877990722656, 0.0864105224609375, 0.09296226501464844, 0.09951400756835938, 0.10606575012207031, 0.11261749267578125, 0.11916923522949219, 0.12572097778320312, 0.13227272033691406, 0.138824462890625, 0.14537620544433594, 0.15192794799804688, 0.1584796905517578, 0.16503143310546875, 0.1715831756591797, 0.17813491821289062, 0.18468666076660156, 0.1912384033203125, 0.19779014587402344, 0.20434188842773438, 0.2108936309814453, 0.21744537353515625, 0.2239971160888672, 0.23054885864257812, 0.23710060119628906, 0.24365234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 5.0, 3.0, 5.0, 14.0, 5.0, 22.0, 20.0, 38.0, 39.0, 64.0, 66.0, 73.0, 89.0, 90.0, 79.0, 67.0, 71.0, 42.0, 44.0, 28.0, 31.0, 10.0, 13.0, 5.0, 16.0, 8.0, 9.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0], "bins": [-0.1424560546875, -0.13886260986328125, -0.1352691650390625, -0.13167572021484375, -0.128082275390625, -0.12448883056640625, -0.1208953857421875, -0.11730194091796875, -0.11370849609375, -0.11011505126953125, -0.1065216064453125, -0.10292816162109375, -0.099334716796875, -0.09574127197265625, -0.0921478271484375, -0.08855438232421875, -0.0849609375, -0.08136749267578125, -0.0777740478515625, -0.07418060302734375, -0.070587158203125, -0.06699371337890625, -0.0634002685546875, -0.05980682373046875, -0.05621337890625, -0.05261993408203125, -0.0490264892578125, -0.04543304443359375, -0.041839599609375, -0.03824615478515625, -0.0346527099609375, -0.03105926513671875, -0.0274658203125, -0.02387237548828125, -0.0202789306640625, -0.01668548583984375, -0.013092041015625, -0.00949859619140625, -0.0059051513671875, -0.00231170654296875, 0.00128173828125, 0.00487518310546875, 0.0084686279296875, 0.01206207275390625, 0.015655517578125, 0.01924896240234375, 0.0228424072265625, 0.02643585205078125, 0.030029296875, 0.03362274169921875, 0.0372161865234375, 0.04080963134765625, 0.044403076171875, 0.04799652099609375, 0.0515899658203125, 0.05518341064453125, 0.05877685546875, 0.06237030029296875, 0.0659637451171875, 0.06955718994140625, 0.073150634765625, 0.07674407958984375, 0.0803375244140625, 0.08393096923828125, 0.0875244140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 18.0, 80.0, 295.0, 394.0, 114.0, 34.0, 22.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9648702144622803, -1.7874879837036133, -1.6101056337356567, -1.4327232837677002, -1.2553410530090332, -1.0779588222503662, -0.9005764722824097, -0.7231941223144531, -0.5458118915557861, -0.36842960119247437, -0.1910473108291626, -0.01366502046585083, 0.16371726989746094, 0.3410995602607727, 0.5184818506240845, 0.695864200592041, 0.873246431350708, 1.050628662109375, 1.2280110120773315, 1.405393362045288, 1.582775592803955, 1.760157823562622, 1.9375401735305786, 2.114922523498535, 2.292304754257202, 2.469686985015869, 2.6470694541931152, 2.8244516849517822, 3.001833915710449, 3.179216146469116, 3.356598377227783, 3.5339808464050293, 3.711362838745117, 3.888745069503784, 4.066127300262451, 4.243509769439697, 4.420891761779785, 4.598274230957031, 4.775656700134277, 4.953039169311523, 5.130421161651611, 5.307803630828857, 5.485185623168945, 5.662568092346191, 5.8399505615234375, 6.017332553863525, 6.1947150230407715, 6.372097015380859, 6.5494794845581055, 6.726861953735352, 6.9042439460754395, 7.0816264152526855, 7.259008407592773, 7.4363908767700195, 7.613773345947266, 7.791155815124512, 7.9685378074646, 8.145919799804688, 8.323302268981934, 8.50068473815918, 8.678067207336426, 8.855449676513672, 9.032831192016602, 9.210213661193848, 9.387596130371094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 5.0, 6.0, 2.0, 3.0, 5.0, 11.0, 12.0, 15.0, 15.0, 8.0, 21.0, 23.0, 14.0, 23.0, 21.0, 34.0, 21.0, 29.0, 29.0, 33.0, 52.0, 68.0, 58.0, 55.0, 60.0, 34.0, 53.0, 44.0, 24.0, 22.0, 28.0, 20.0, 25.0, 21.0, 17.0, 12.0, 13.0, 10.0, 9.0, 6.0, 9.0, 6.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.0536327362060547, -1.9866238832473755, -1.9196151494979858, -1.8526062965393066, -1.785597562789917, -1.7185887098312378, -1.6515798568725586, -1.584571123123169, -1.5175623893737793, -1.4505535364151, -1.3835448026657104, -1.3165359497070312, -1.2495272159576416, -1.1825183629989624, -1.1155095100402832, -1.0485007762908936, -0.9814919233322144, -0.9144831299781799, -0.8474743366241455, -0.7804654836654663, -0.7134567499160767, -0.6464478969573975, -0.579439103603363, -0.5124303102493286, -0.4454215168952942, -0.37841272354125977, -0.31140393018722534, -0.24439510703086853, -0.1773863136768341, -0.11037752032279968, -0.04336869716644287, 0.023640096187591553, 0.09064888954162598, 0.1576576828956604, 0.22466649115085602, 0.29167529940605164, 0.35868409276008606, 0.4256928861141205, 0.4927017092704773, 0.5597105026245117, 0.6267192959785461, 0.6937280893325806, 0.760736882686615, 0.8277456760406494, 0.8947545289993286, 0.9617632627487183, 1.0287721157073975, 1.095780849456787, 1.1627897024154663, 1.2297985553741455, 1.2968072891235352, 1.3638161420822144, 1.430824875831604, 1.4978337287902832, 1.5648424625396729, 1.631851315498352, 1.6988601684570312, 1.7658690214157104, 1.8328777551651, 1.8998866081237793, 1.966895341873169, 2.0339040756225586, 2.1009130477905273, 2.167921781539917, 2.2349305152893066]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 18.0, 29.0, 49.0, 83.0, 198.0, 473.0, 1685.0, 12565.0, 685095.0, 3442515.0, 47180.0, 3140.0, 677.0, 276.0, 145.0, 71.0, 34.0, 23.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6435546875, -0.6283111572265625, -0.613067626953125, -0.5978240966796875, -0.58258056640625, -0.5673370361328125, -0.552093505859375, -0.5368499755859375, -0.5216064453125, -0.5063629150390625, -0.491119384765625, -0.4758758544921875, -0.46063232421875, -0.4453887939453125, -0.430145263671875, -0.4149017333984375, -0.399658203125, -0.3844146728515625, -0.369171142578125, -0.3539276123046875, -0.33868408203125, -0.3234405517578125, -0.308197021484375, -0.2929534912109375, -0.2777099609375, -0.2624664306640625, -0.247222900390625, -0.2319793701171875, -0.21673583984375, -0.2014923095703125, -0.186248779296875, -0.1710052490234375, -0.15576171875, -0.1405181884765625, -0.125274658203125, -0.1100311279296875, -0.09478759765625, -0.0795440673828125, -0.064300537109375, -0.0490570068359375, -0.0338134765625, -0.0185699462890625, -0.003326416015625, 0.0119171142578125, 0.02716064453125, 0.0424041748046875, 0.057647705078125, 0.0728912353515625, 0.088134765625, 0.1033782958984375, 0.118621826171875, 0.1338653564453125, 0.14910888671875, 0.1643524169921875, 0.179595947265625, 0.1948394775390625, 0.2100830078125, 0.2253265380859375, 0.240570068359375, 0.2558135986328125, 0.27105712890625, 0.2863006591796875, 0.301544189453125, 0.3167877197265625, 0.33203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 13.0, 8.0, 13.0, 30.0, 39.0, 44.0, 43.0, 60.0, 61.0, 74.0, 75.0, 74.0, 58.0, 74.0, 65.0, 45.0, 49.0, 37.0, 38.0, 25.0, 22.0, 10.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23218345642089844, -0.22449874877929688, -0.2168140411376953, -0.20912933349609375, -0.2014446258544922, -0.19375991821289062, -0.18607521057128906, -0.1783905029296875, -0.17070579528808594, -0.16302108764648438, -0.1553363800048828, -0.14765167236328125, -0.1399669647216797, -0.13228225708007812, -0.12459754943847656, -0.116912841796875, -0.10922813415527344, -0.10154342651367188, -0.09385871887207031, -0.08617401123046875, -0.07848930358886719, -0.07080459594726562, -0.06311988830566406, -0.0554351806640625, -0.04775047302246094, -0.040065765380859375, -0.03238105773925781, -0.02469635009765625, -0.017011642456054688, -0.009326934814453125, -0.0016422271728515625, 0.00604248046875, 0.013727188110351562, 0.021411895751953125, 0.029096603393554688, 0.03678131103515625, 0.04446601867675781, 0.052150726318359375, 0.05983543395996094, 0.0675201416015625, 0.07520484924316406, 0.08288955688476562, 0.09057426452636719, 0.09825897216796875, 0.10594367980957031, 0.11362838745117188, 0.12131309509277344, 0.128997802734375, 0.13668251037597656, 0.14436721801757812, 0.1520519256591797, 0.15973663330078125, 0.1674213409423828, 0.17510604858398438, 0.18279075622558594, 0.1904754638671875, 0.19816017150878906, 0.20584487915039062, 0.2135295867919922, 0.22121429443359375, 0.2288990020751953, 0.23658370971679688, 0.24426841735839844, 0.251953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 15.0, 28.0, 38.0, 77.0, 187.0, 470.0, 1185.0, 3411.0, 23994.0, 4034642.0, 123343.0, 4695.0, 1259.0, 461.0, 238.0, 115.0, 53.0, 18.0, 21.0, 12.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6123046875, -0.5884628295898438, -0.5646209716796875, -0.5407791137695312, -0.516937255859375, -0.49309539794921875, -0.4692535400390625, -0.44541168212890625, -0.42156982421875, -0.39772796630859375, -0.3738861083984375, -0.35004425048828125, -0.326202392578125, -0.30236053466796875, -0.2785186767578125, -0.25467681884765625, -0.2308349609375, -0.20699310302734375, -0.1831512451171875, -0.15930938720703125, -0.135467529296875, -0.11162567138671875, -0.0877838134765625, -0.06394195556640625, -0.04010009765625, -0.01625823974609375, 0.0075836181640625, 0.03142547607421875, 0.055267333984375, 0.07910919189453125, 0.1029510498046875, 0.12679290771484375, 0.150634765625, 0.17447662353515625, 0.1983184814453125, 0.22216033935546875, 0.246002197265625, 0.26984405517578125, 0.2936859130859375, 0.31752777099609375, 0.34136962890625, 0.36521148681640625, 0.3890533447265625, 0.41289520263671875, 0.436737060546875, 0.46057891845703125, 0.4844207763671875, 0.5082626342773438, 0.5321044921875, 0.5559463500976562, 0.5797882080078125, 0.6036300659179688, 0.627471923828125, 0.6513137817382812, 0.6751556396484375, 0.6989974975585938, 0.72283935546875, 0.7466812133789062, 0.7705230712890625, 0.7943649291992188, 0.818206787109375, 0.8420486450195312, 0.8658905029296875, 0.8897323608398438, 0.91357421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 6.0, 31.0, 48.0, 98.0, 359.0, 1109.0, 1496.0, 604.0, 163.0, 70.0, 33.0, 13.0, 11.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7109375, -0.6901702880859375, -0.669403076171875, -0.6486358642578125, -0.62786865234375, -0.6071014404296875, -0.586334228515625, -0.5655670166015625, -0.5447998046875, -0.5240325927734375, -0.503265380859375, -0.4824981689453125, -0.46173095703125, -0.4409637451171875, -0.420196533203125, -0.3994293212890625, -0.378662109375, -0.3578948974609375, -0.337127685546875, -0.3163604736328125, -0.29559326171875, -0.2748260498046875, -0.254058837890625, -0.2332916259765625, -0.2125244140625, -0.1917572021484375, -0.170989990234375, -0.1502227783203125, -0.12945556640625, -0.1086883544921875, -0.087921142578125, -0.0671539306640625, -0.04638671875, -0.0256195068359375, -0.004852294921875, 0.0159149169921875, 0.03668212890625, 0.0574493408203125, 0.078216552734375, 0.0989837646484375, 0.1197509765625, 0.1405181884765625, 0.161285400390625, 0.1820526123046875, 0.20281982421875, 0.2235870361328125, 0.244354248046875, 0.2651214599609375, 0.285888671875, 0.3066558837890625, 0.327423095703125, 0.3481903076171875, 0.36895751953125, 0.3897247314453125, 0.410491943359375, 0.4312591552734375, 0.4520263671875, 0.4727935791015625, 0.493560791015625, 0.5143280029296875, 0.53509521484375, 0.5558624267578125, 0.576629638671875, 0.5973968505859375, 0.6181640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 9.0, 24.0, 122.0, 507.0, 268.0, 42.0, 6.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.73887825012207, -8.506672859191895, -8.274467468261719, -8.042261123657227, -7.810055732727051, -7.577850341796875, -7.345644950866699, -7.113439083099365, -6.881233215332031, -6.6490278244018555, -6.4168219566345215, -6.184616565704346, -5.952410697937012, -5.720205307006836, -5.48799991607666, -5.255794048309326, -5.02358865737915, -4.791383266448975, -4.559177398681641, -4.326972007751465, -4.094766139984131, -3.862560749053955, -3.6303551197052, -3.3981494903564453, -3.1659438610076904, -2.9337382316589355, -2.7015326023101807, -2.469326972961426, -2.23712158203125, -2.004915714263916, -1.7727103233337402, -1.5405046939849854, -1.3082990646362305, -1.0760934352874756, -0.8438878655433655, -0.6116822957992554, -0.3794766664505005, -0.1472710371017456, 0.08493447303771973, 0.3171401023864746, 0.5493457317352295, 0.7815513610839844, 1.0137569904327393, 1.2459625005722046, 1.4781681299209595, 1.7103737592697144, 1.9425792694091797, 2.1747848987579346, 2.4069905281066895, 2.6391961574554443, 2.871401786804199, 3.103607177734375, 3.335813045501709, 3.5680184364318848, 3.8002240657806396, 4.0324296951293945, 4.26463508605957, 4.496840476989746, 4.72904634475708, 4.961251735687256, 5.19345760345459, 5.425662994384766, 5.657868385314941, 5.890074253082275, 6.122280120849609]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 16.0, 30.0, 67.0, 79.0, 87.0, 136.0, 142.0, 124.0, 109.0, 88.0, 51.0, 31.0, 11.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.660445213317871, -3.5347414016723633, -3.4090375900268555, -3.2833337783813477, -3.1576297283172607, -3.031925916671753, -2.906222105026245, -2.7805182933807373, -2.6548142433166504, -2.5291104316711426, -2.4034066200256348, -2.277702808380127, -2.15199875831604, -2.0262949466705322, -1.9005911350250244, -1.7748873233795166, -1.6491835117340088, -1.523479700088501, -1.3977757692337036, -1.2720719575881958, -1.1463680267333984, -1.0206642150878906, -0.8949604034423828, -0.7692565321922302, -0.6435526609420776, -0.517848789691925, -0.39214494824409485, -0.26644110679626465, -0.14073723554611206, -0.015033364295959473, 0.11067044734954834, 0.23637431859970093, 0.3620781898498535, 0.4877820611000061, 0.6134859323501587, 0.7391897439956665, 0.8648936152458191, 0.9905974864959717, 1.1163012981414795, 1.2420051097869873, 1.3677090406417847, 1.4934128522872925, 1.6191167831420898, 1.7448205947875977, 1.8705244064331055, 1.9962283372879028, 2.121932029724121, 2.247636079788208, 2.373339891433716, 2.4990437030792236, 2.6247475147247314, 2.7504515647888184, 2.876155376434326, 3.001859188079834, 3.127562999725342, 3.2532668113708496, 3.3789706230163574, 3.5046744346618652, 3.630378246307373, 3.756082057952881, 3.8817861080169678, 4.007490158081055, 4.1331939697265625, 4.25889778137207, 4.384601593017578]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 1.0, 6.0, 10.0, 11.0, 20.0, 19.0, 32.0, 55.0, 83.0, 142.0, 297.0, 604.0, 1427.0, 4283.0, 19119.0, 140198.0, 654690.0, 194959.0, 24338.0, 5226.0, 1649.0, 636.0, 301.0, 160.0, 96.0, 42.0, 50.0, 17.0, 20.0, 13.0, 8.0, 10.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.43310546875, -0.4205780029296875, -0.408050537109375, -0.3955230712890625, -0.38299560546875, -0.3704681396484375, -0.357940673828125, -0.3454132080078125, -0.3328857421875, -0.3203582763671875, -0.307830810546875, -0.2953033447265625, -0.28277587890625, -0.2702484130859375, -0.257720947265625, -0.2451934814453125, -0.232666015625, -0.2201385498046875, -0.207611083984375, -0.1950836181640625, -0.18255615234375, -0.1700286865234375, -0.157501220703125, -0.1449737548828125, -0.1324462890625, -0.1199188232421875, -0.107391357421875, -0.0948638916015625, -0.08233642578125, -0.0698089599609375, -0.057281494140625, -0.0447540283203125, -0.0322265625, -0.0196990966796875, -0.007171630859375, 0.0053558349609375, 0.01788330078125, 0.0304107666015625, 0.042938232421875, 0.0554656982421875, 0.0679931640625, 0.0805206298828125, 0.093048095703125, 0.1055755615234375, 0.11810302734375, 0.1306304931640625, 0.143157958984375, 0.1556854248046875, 0.168212890625, 0.1807403564453125, 0.193267822265625, 0.2057952880859375, 0.21832275390625, 0.2308502197265625, 0.243377685546875, 0.2559051513671875, 0.2684326171875, 0.2809600830078125, 0.293487548828125, 0.3060150146484375, 0.31854248046875, 0.3310699462890625, 0.343597412109375, 0.3561248779296875, 0.36865234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 12.0, 5.0, 10.0, 12.0, 18.0, 37.0, 25.0, 36.0, 43.0, 65.0, 63.0, 74.0, 80.0, 64.0, 70.0, 66.0, 75.0, 59.0, 32.0, 41.0, 30.0, 16.0, 21.0, 14.0, 15.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.239013671875, -0.2313690185546875, -0.223724365234375, -0.2160797119140625, -0.20843505859375, -0.2007904052734375, -0.193145751953125, -0.1855010986328125, -0.1778564453125, -0.1702117919921875, -0.162567138671875, -0.1549224853515625, -0.14727783203125, -0.1396331787109375, -0.131988525390625, -0.1243438720703125, -0.11669921875, -0.1090545654296875, -0.101409912109375, -0.0937652587890625, -0.08612060546875, -0.0784759521484375, -0.070831298828125, -0.0631866455078125, -0.0555419921875, -0.0478973388671875, -0.040252685546875, -0.0326080322265625, -0.02496337890625, -0.0173187255859375, -0.009674072265625, -0.0020294189453125, 0.005615234375, 0.0132598876953125, 0.020904541015625, 0.0285491943359375, 0.03619384765625, 0.0438385009765625, 0.051483154296875, 0.0591278076171875, 0.0667724609375, 0.0744171142578125, 0.082061767578125, 0.0897064208984375, 0.09735107421875, 0.1049957275390625, 0.112640380859375, 0.1202850341796875, 0.1279296875, 0.1355743408203125, 0.143218994140625, 0.1508636474609375, 0.15850830078125, 0.1661529541015625, 0.173797607421875, 0.1814422607421875, 0.1890869140625, 0.1967315673828125, 0.204376220703125, 0.2120208740234375, 0.21966552734375, 0.2273101806640625, 0.234954833984375, 0.2425994873046875, 0.250244140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 7.0, 16.0, 20.0, 16.0, 33.0, 44.0, 34.0, 76.0, 87.0, 145.0, 208.0, 411.0, 783.0, 2085.0, 8423.0, 52166.0, 573892.0, 356924.0, 42392.0, 7123.0, 1879.0, 708.0, 344.0, 202.0, 150.0, 98.0, 66.0, 61.0, 31.0, 19.0, 20.0, 18.0, 17.0, 13.0, 6.0, 6.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.33544921875, -0.3230018615722656, -0.31055450439453125, -0.2981071472167969, -0.2856597900390625, -0.2732124328613281, -0.26076507568359375, -0.24831771850585938, -0.235870361328125, -0.22342300415039062, -0.21097564697265625, -0.19852828979492188, -0.1860809326171875, -0.17363357543945312, -0.16118621826171875, -0.14873886108398438, -0.13629150390625, -0.12384414672851562, -0.11139678955078125, -0.09894943237304688, -0.0865020751953125, -0.07405471801757812, -0.06160736083984375, -0.049160003662109375, -0.036712646484375, -0.024265289306640625, -0.01181793212890625, 0.000629425048828125, 0.0130767822265625, 0.025524139404296875, 0.03797149658203125, 0.050418853759765625, 0.0628662109375, 0.07531356811523438, 0.08776092529296875, 0.10020828247070312, 0.1126556396484375, 0.12510299682617188, 0.13755035400390625, 0.14999771118164062, 0.162445068359375, 0.17489242553710938, 0.18733978271484375, 0.19978713989257812, 0.2122344970703125, 0.22468185424804688, 0.23712921142578125, 0.24957656860351562, 0.26202392578125, 0.2744712829589844, 0.28691864013671875, 0.2993659973144531, 0.3118133544921875, 0.3242607116699219, 0.33670806884765625, 0.3491554260253906, 0.361602783203125, 0.3740501403808594, 0.38649749755859375, 0.3989448547363281, 0.4113922119140625, 0.4238395690917969, 0.43628692626953125, 0.4487342834472656, 0.461181640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 6.0, 5.0, 9.0, 4.0, 7.0, 6.0, 18.0, 9.0, 14.0, 15.0, 14.0, 23.0, 36.0, 29.0, 32.0, 43.0, 38.0, 47.0, 51.0, 51.0, 49.0, 49.0, 34.0, 42.0, 35.0, 35.0, 40.0, 38.0, 29.0, 29.0, 18.0, 31.0, 19.0, 19.0, 11.0, 13.0, 10.0, 7.0, 8.0, 4.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444091796875, -0.4276390075683594, -0.41118621826171875, -0.3947334289550781, -0.3782806396484375, -0.3618278503417969, -0.34537506103515625, -0.3289222717285156, -0.312469482421875, -0.2960166931152344, -0.27956390380859375, -0.2631111145019531, -0.2466583251953125, -0.23020553588867188, -0.21375274658203125, -0.19729995727539062, -0.18084716796875, -0.16439437866210938, -0.14794158935546875, -0.13148880004882812, -0.1150360107421875, -0.09858322143554688, -0.08213043212890625, -0.06567764282226562, -0.049224853515625, -0.032772064208984375, -0.01631927490234375, 0.000133514404296875, 0.0165863037109375, 0.033039093017578125, 0.04949188232421875, 0.06594467163085938, 0.0823974609375, 0.09885025024414062, 0.11530303955078125, 0.13175582885742188, 0.1482086181640625, 0.16466140747070312, 0.18111419677734375, 0.19756698608398438, 0.214019775390625, 0.23047256469726562, 0.24692535400390625, 0.2633781433105469, 0.2798309326171875, 0.2962837219238281, 0.31273651123046875, 0.3291893005371094, 0.34564208984375, 0.3620948791503906, 0.37854766845703125, 0.3950004577636719, 0.4114532470703125, 0.4279060363769531, 0.44435882568359375, 0.4608116149902344, 0.477264404296875, 0.4937171936035156, 0.5101699829101562, 0.5266227722167969, 0.5430755615234375, 0.5595283508300781, 0.5759811401367188, 0.5924339294433594, 0.60888671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 12.0, 15.0, 31.0, 44.0, 70.0, 143.0, 304.0, 997.0, 4611.0, 30459.0, 554426.0, 421533.0, 29786.0, 4446.0, 1005.0, 338.0, 143.0, 75.0, 36.0, 23.0, 13.0, 7.0, 8.0, 1.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.18947124481201172, -0.18448448181152344, -0.17949771881103516, -0.17451095581054688, -0.1695241928100586, -0.1645374298095703, -0.15955066680908203, -0.15456390380859375, -0.14957714080810547, -0.1445903778076172, -0.1396036148071289, -0.13461685180664062, -0.12963008880615234, -0.12464332580566406, -0.11965656280517578, -0.1146697998046875, -0.10968303680419922, -0.10469627380371094, -0.09970951080322266, -0.09472274780273438, -0.0897359848022461, -0.08474922180175781, -0.07976245880126953, -0.07477569580078125, -0.06978893280029297, -0.06480216979980469, -0.059815406799316406, -0.054828643798828125, -0.049841880798339844, -0.04485511779785156, -0.03986835479736328, -0.034881591796875, -0.02989482879638672, -0.024908065795898438, -0.019921302795410156, -0.014934539794921875, -0.009947776794433594, -0.0049610137939453125, 2.574920654296875e-05, 0.00501251220703125, 0.009999275207519531, 0.014986038208007812, 0.019972801208496094, 0.024959564208984375, 0.029946327209472656, 0.03493309020996094, 0.03991985321044922, 0.0449066162109375, 0.04989337921142578, 0.05488014221191406, 0.059866905212402344, 0.06485366821289062, 0.0698404312133789, 0.07482719421386719, 0.07981395721435547, 0.08480072021484375, 0.08978748321533203, 0.09477424621582031, 0.0997610092163086, 0.10474777221679688, 0.10973453521728516, 0.11472129821777344, 0.11970806121826172, 0.12469482421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 2.0, 14.0, 17.0, 29.0, 50.0, 60.0, 91.0, 125.0, 137.0, 124.0, 124.0, 70.0, 52.0, 33.0, 25.0, 9.0, 12.0, 5.0, 1.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23464584350586e-05, -6.009731441736221e-05, -5.784817039966583e-05, -5.559902638196945e-05, -5.334988236427307e-05, -5.110073834657669e-05, -4.885159432888031e-05, -4.660245031118393e-05, -4.435330629348755e-05, -4.210416227579117e-05, -3.985501825809479e-05, -3.760587424039841e-05, -3.5356730222702026e-05, -3.3107586205005646e-05, -3.0858442187309265e-05, -2.8609298169612885e-05, -2.6360154151916504e-05, -2.4111010134220123e-05, -2.1861866116523743e-05, -1.9612722098827362e-05, -1.736357808113098e-05, -1.51144340634346e-05, -1.286529004573822e-05, -1.061614602804184e-05, -8.367002010345459e-06, -6.117857992649078e-06, -3.868713974952698e-06, -1.6195699572563171e-06, 6.295740604400635e-07, 2.878718078136444e-06, 5.127862095832825e-06, 7.377006113529205e-06, 9.626150131225586e-06, 1.1875294148921967e-05, 1.4124438166618347e-05, 1.6373582184314728e-05, 1.862272620201111e-05, 2.087187021970749e-05, 2.312101423740387e-05, 2.537015825510025e-05, 2.761930227279663e-05, 2.986844629049301e-05, 3.211759030818939e-05, 3.436673432588577e-05, 3.661587834358215e-05, 3.8865022361278534e-05, 4.1114166378974915e-05, 4.3363310396671295e-05, 4.5612454414367676e-05, 4.7861598432064056e-05, 5.011074244976044e-05, 5.235988646745682e-05, 5.46090304851532e-05, 5.685817450284958e-05, 5.910731852054596e-05, 6.135646253824234e-05, 6.360560655593872e-05, 6.58547505736351e-05, 6.810389459133148e-05, 7.035303860902786e-05, 7.260218262672424e-05, 7.485132664442062e-05, 7.7100470662117e-05, 7.934961467981339e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 15.0, 16.0, 20.0, 43.0, 80.0, 130.0, 264.0, 775.0, 2737.0, 14508.0, 140450.0, 792281.0, 84067.0, 10035.0, 2004.0, 582.0, 251.0, 104.0, 68.0, 43.0, 26.0, 12.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2022705078125, -0.19738483428955078, -0.19249916076660156, -0.18761348724365234, -0.18272781372070312, -0.1778421401977539, -0.1729564666748047, -0.16807079315185547, -0.16318511962890625, -0.15829944610595703, -0.1534137725830078, -0.1485280990600586, -0.14364242553710938, -0.13875675201416016, -0.13387107849121094, -0.12898540496826172, -0.1240997314453125, -0.11921405792236328, -0.11432838439941406, -0.10944271087646484, -0.10455703735351562, -0.0996713638305664, -0.09478569030761719, -0.08990001678466797, -0.08501434326171875, -0.08012866973876953, -0.07524299621582031, -0.0703573226928711, -0.06547164916992188, -0.060585975646972656, -0.05570030212402344, -0.05081462860107422, -0.045928955078125, -0.04104328155517578, -0.03615760803222656, -0.031271934509277344, -0.026386260986328125, -0.021500587463378906, -0.016614913940429688, -0.011729240417480469, -0.00684356689453125, -0.0019578933715820312, 0.0029277801513671875, 0.007813453674316406, 0.012699127197265625, 0.017584800720214844, 0.022470474243164062, 0.02735614776611328, 0.0322418212890625, 0.03712749481201172, 0.04201316833496094, 0.046898841857910156, 0.051784515380859375, 0.056670188903808594, 0.06155586242675781, 0.06644153594970703, 0.07132720947265625, 0.07621288299560547, 0.08109855651855469, 0.0859842300415039, 0.09086990356445312, 0.09575557708740234, 0.10064125061035156, 0.10552692413330078, 0.11041259765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 8.0, 5.0, 3.0, 9.0, 14.0, 19.0, 27.0, 51.0, 56.0, 82.0, 84.0, 109.0, 133.0, 96.0, 91.0, 59.0, 32.0, 33.0, 36.0, 20.0, 11.0, 8.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.12943267822265625, -0.1248321533203125, -0.12023162841796875, -0.115631103515625, -0.11103057861328125, -0.1064300537109375, -0.10182952880859375, -0.09722900390625, -0.09262847900390625, -0.0880279541015625, -0.08342742919921875, -0.078826904296875, -0.07422637939453125, -0.0696258544921875, -0.06502532958984375, -0.0604248046875, -0.05582427978515625, -0.0512237548828125, -0.04662322998046875, -0.042022705078125, -0.03742218017578125, -0.0328216552734375, -0.02822113037109375, -0.02362060546875, -0.01902008056640625, -0.0144195556640625, -0.00981903076171875, -0.005218505859375, -0.00061798095703125, 0.0039825439453125, 0.00858306884765625, 0.01318359375, 0.01778411865234375, 0.0223846435546875, 0.02698516845703125, 0.031585693359375, 0.03618621826171875, 0.0407867431640625, 0.04538726806640625, 0.04998779296875, 0.05458831787109375, 0.0591888427734375, 0.06378936767578125, 0.068389892578125, 0.07299041748046875, 0.0775909423828125, 0.08219146728515625, 0.0867919921875, 0.09139251708984375, 0.0959930419921875, 0.10059356689453125, 0.105194091796875, 0.10979461669921875, 0.1143951416015625, 0.11899566650390625, 0.12359619140625, 0.12819671630859375, 0.1327972412109375, 0.13739776611328125, 0.141998291015625, 0.14659881591796875, 0.1511993408203125, 0.15579986572265625, 0.160400390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 5.0, 14.0, 41.0, 119.0, 313.0, 374.0, 82.0, 26.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.067654132843018, -6.907448768615723, -6.747243881225586, -6.587038516998291, -6.426833152770996, -6.266628265380859, -6.1064229011535645, -5.9462175369262695, -5.786012649536133, -5.625807285308838, -5.465602397918701, -5.305397033691406, -5.1451921463012695, -4.984986782073975, -4.82478141784668, -4.664576530456543, -4.504371166229248, -4.344165802001953, -4.183960914611816, -4.0237555503845215, -3.8635504245758057, -3.70334529876709, -3.543139934539795, -3.382934808731079, -3.2227296829223633, -3.0625245571136475, -2.9023194313049316, -2.7421140670776367, -2.581908941268921, -2.421703815460205, -2.26149845123291, -2.1012933254241943, -1.9410877227783203, -1.7808825969696045, -1.6206773519515991, -1.4604721069335938, -1.300266981124878, -1.140061855316162, -0.9798566102981567, -0.8196513652801514, -0.6594462394714355, -0.49924105405807495, -0.33903586864471436, -0.17883068323135376, -0.018625497817993164, 0.14157968759536743, 0.301784873008728, 0.4619901180267334, 0.6221952438354492, 0.7824004292488098, 0.9426056146621704, 1.1028108596801758, 1.2630159854888916, 1.4232211112976074, 1.5834263563156128, 1.7436316013336182, 1.903836727142334, 2.06404185295105, 2.2242469787597656, 2.3844523429870605, 2.5446574687957764, 2.704862594604492, 2.865067958831787, 3.025273084640503, 3.1854782104492188]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 11.0, 9.0, 7.0, 18.0, 24.0, 18.0, 12.0, 31.0, 28.0, 29.0, 35.0, 28.0, 35.0, 58.0, 62.0, 81.0, 78.0, 54.0, 42.0, 42.0, 24.0, 33.0, 27.0, 35.0, 26.0, 22.0, 16.0, 17.0, 12.0, 17.0, 10.0, 6.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9093279838562012, -1.8437790870666504, -1.7782301902770996, -1.7126811742782593, -1.6471322774887085, -1.5815833806991577, -1.5160343647003174, -1.4504854679107666, -1.3849365711212158, -1.319387674331665, -1.2538387775421143, -1.188289761543274, -1.1227408647537231, -1.0571919679641724, -0.9916430115699768, -0.9260940551757812, -0.8605451583862305, -0.7949962615966797, -0.7294473052024841, -0.6638983488082886, -0.5983494520187378, -0.532800555229187, -0.46725159883499146, -0.4017026722431183, -0.3361537456512451, -0.27060481905937195, -0.20505589246749878, -0.1395069658756256, -0.07395803928375244, -0.008409112691879272, 0.057139813899993896, 0.12268874049186707, 0.18823742866516113, 0.2537863552570343, 0.31933528184890747, 0.38488420844078064, 0.4504331350326538, 0.5159820318222046, 0.5815309882164001, 0.6470799446105957, 0.7126288414001465, 0.7781777381896973, 0.8437266945838928, 0.9092756509780884, 0.9748245477676392, 1.04037344455719, 1.1059224605560303, 1.171471357345581, 1.2370202541351318, 1.3025691509246826, 1.3681180477142334, 1.4336670637130737, 1.4992159605026245, 1.5647648572921753, 1.6303138732910156, 1.6958627700805664, 1.7614116668701172, 1.826960563659668, 1.8925094604492188, 1.958058476448059, 2.0236072540283203, 2.08915638923645, 2.154705286026001, 2.2202541828155518, 2.2858030796051025]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 10.0, 5.0, 12.0, 23.0, 35.0, 43.0, 70.0, 142.0, 250.0, 538.0, 1440.0, 4490.0, 19139.0, 192557.0, 2501049.0, 1368568.0, 89454.0, 11532.0, 3000.0, 1032.0, 395.0, 183.0, 110.0, 61.0, 33.0, 26.0, 18.0, 7.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24609375, -0.23836708068847656, -0.23064041137695312, -0.2229137420654297, -0.21518707275390625, -0.2074604034423828, -0.19973373413085938, -0.19200706481933594, -0.1842803955078125, -0.17655372619628906, -0.16882705688476562, -0.1611003875732422, -0.15337371826171875, -0.1456470489501953, -0.13792037963867188, -0.13019371032714844, -0.122467041015625, -0.11474037170410156, -0.10701370239257812, -0.09928703308105469, -0.09156036376953125, -0.08383369445800781, -0.07610702514648438, -0.06838035583496094, -0.0606536865234375, -0.05292701721191406, -0.045200347900390625, -0.03747367858886719, -0.02974700927734375, -0.022020339965820312, -0.014293670654296875, -0.0065670013427734375, 0.00115966796875, 0.008886337280273438, 0.016613006591796875, 0.024339675903320312, 0.03206634521484375, 0.03979301452636719, 0.047519683837890625, 0.05524635314941406, 0.0629730224609375, 0.07069969177246094, 0.07842636108398438, 0.08615303039550781, 0.09387969970703125, 0.10160636901855469, 0.10933303833007812, 0.11705970764160156, 0.124786376953125, 0.13251304626464844, 0.14023971557617188, 0.1479663848876953, 0.15569305419921875, 0.1634197235107422, 0.17114639282226562, 0.17887306213378906, 0.1865997314453125, 0.19432640075683594, 0.20205307006835938, 0.2097797393798828, 0.21750640869140625, 0.2252330780029297, 0.23295974731445312, 0.24068641662597656, 0.2484130859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 6.0, 13.0, 11.0, 18.0, 22.0, 32.0, 40.0, 45.0, 66.0, 55.0, 89.0, 70.0, 71.0, 68.0, 86.0, 64.0, 56.0, 29.0, 34.0, 42.0, 28.0, 13.0, 11.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.2388324737548828, -0.23120498657226562, -0.22357749938964844, -0.21595001220703125, -0.20832252502441406, -0.20069503784179688, -0.1930675506591797, -0.1854400634765625, -0.1778125762939453, -0.17018508911132812, -0.16255760192871094, -0.15493011474609375, -0.14730262756347656, -0.13967514038085938, -0.1320476531982422, -0.124420166015625, -0.11679267883300781, -0.10916519165039062, -0.10153770446777344, -0.09391021728515625, -0.08628273010253906, -0.07865524291992188, -0.07102775573730469, -0.0634002685546875, -0.05577278137207031, -0.048145294189453125, -0.04051780700683594, -0.03289031982421875, -0.025262832641601562, -0.017635345458984375, -0.010007858276367188, -0.00238037109375, 0.0052471160888671875, 0.012874603271484375, 0.020502090454101562, 0.02812957763671875, 0.03575706481933594, 0.043384552001953125, 0.05101203918457031, 0.0586395263671875, 0.06626701354980469, 0.07389450073242188, 0.08152198791503906, 0.08914947509765625, 0.09677696228027344, 0.10440444946289062, 0.11203193664550781, 0.119659423828125, 0.1272869110107422, 0.13491439819335938, 0.14254188537597656, 0.15016937255859375, 0.15779685974121094, 0.16542434692382812, 0.1730518341064453, 0.1806793212890625, 0.1883068084716797, 0.19593429565429688, 0.20356178283691406, 0.21118927001953125, 0.21881675720214844, 0.22644424438476562, 0.2340717315673828, 0.24169921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 14.0, 22.0, 35.0, 44.0, 63.0, 107.0, 195.0, 393.0, 851.0, 2787.0, 11995.0, 98028.0, 2926017.0, 1096862.0, 45979.0, 7392.0, 1981.0, 699.0, 344.0, 153.0, 89.0, 61.0, 42.0, 28.0, 20.0, 17.0, 7.0, 9.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2646484375, -0.2554740905761719, -0.24629974365234375, -0.23712539672851562, -0.2279510498046875, -0.21877670288085938, -0.20960235595703125, -0.20042800903320312, -0.191253662109375, -0.18207931518554688, -0.17290496826171875, -0.16373062133789062, -0.1545562744140625, -0.14538192749023438, -0.13620758056640625, -0.12703323364257812, -0.11785888671875, -0.10868453979492188, -0.09951019287109375, -0.09033584594726562, -0.0811614990234375, -0.07198715209960938, -0.06281280517578125, -0.053638458251953125, -0.044464111328125, -0.035289764404296875, -0.02611541748046875, -0.016941070556640625, -0.0077667236328125, 0.001407623291015625, 0.01058197021484375, 0.019756317138671875, 0.0289306640625, 0.038105010986328125, 0.04727935791015625, 0.056453704833984375, 0.0656280517578125, 0.07480239868164062, 0.08397674560546875, 0.09315109252929688, 0.102325439453125, 0.11149978637695312, 0.12067413330078125, 0.12984848022460938, 0.1390228271484375, 0.14819717407226562, 0.15737152099609375, 0.16654586791992188, 0.17572021484375, 0.18489456176757812, 0.19406890869140625, 0.20324325561523438, 0.2124176025390625, 0.22159194946289062, 0.23076629638671875, 0.23994064331054688, 0.249114990234375, 0.2582893371582031, 0.26746368408203125, 0.2766380310058594, 0.2858123779296875, 0.2949867248535156, 0.30416107177734375, 0.3133354187011719, 0.322509765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 9.0, 6.0, 10.0, 18.0, 17.0, 28.0, 40.0, 77.0, 105.0, 165.0, 293.0, 426.0, 620.0, 650.0, 567.0, 389.0, 226.0, 140.0, 89.0, 54.0, 27.0, 35.0, 19.0, 18.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.2312297821044922, -0.22307968139648438, -0.21492958068847656, -0.20677947998046875, -0.19862937927246094, -0.19047927856445312, -0.1823291778564453, -0.1741790771484375, -0.1660289764404297, -0.15787887573242188, -0.14972877502441406, -0.14157867431640625, -0.13342857360839844, -0.12527847290039062, -0.11712837219238281, -0.108978271484375, -0.10082817077636719, -0.09267807006835938, -0.08452796936035156, -0.07637786865234375, -0.06822776794433594, -0.060077667236328125, -0.05192756652832031, -0.0437774658203125, -0.03562736511230469, -0.027477264404296875, -0.019327163696289062, -0.01117706298828125, -0.0030269622802734375, 0.005123138427734375, 0.013273239135742188, 0.02142333984375, 0.029573440551757812, 0.037723541259765625, 0.04587364196777344, 0.05402374267578125, 0.06217384338378906, 0.07032394409179688, 0.07847404479980469, 0.0866241455078125, 0.09477424621582031, 0.10292434692382812, 0.11107444763183594, 0.11922454833984375, 0.12737464904785156, 0.13552474975585938, 0.1436748504638672, 0.151824951171875, 0.1599750518798828, 0.16812515258789062, 0.17627525329589844, 0.18442535400390625, 0.19257545471191406, 0.20072555541992188, 0.2088756561279297, 0.2170257568359375, 0.2251758575439453, 0.23332595825195312, 0.24147605895996094, 0.24962615966796875, 0.25777626037597656, 0.2659263610839844, 0.2740764617919922, 0.2822265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 17.0, 18.0, 32.0, 66.0, 111.0, 146.0, 175.0, 161.0, 109.0, 83.0, 34.0, 18.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3326082229614258, -1.2683184146881104, -1.204028606414795, -1.1397387981414795, -1.075448989868164, -1.0111591815948486, -0.9468694925308228, -0.8825796842575073, -0.8182898759841919, -0.7540000677108765, -0.689710259437561, -0.6254205107688904, -0.561130702495575, -0.4968408942222595, -0.4325511157512665, -0.36826133728027344, -0.303971529006958, -0.23968173563480377, -0.17539194226264954, -0.1111021488904953, -0.046812355518341064, 0.017477452754974365, 0.08176723122596741, 0.14605700969696045, 0.21034681797027588, 0.2746366262435913, 0.33892640471458435, 0.4032161831855774, 0.4675059914588928, 0.5317957997322083, 0.5960855484008789, 0.6603753566741943, 0.7246651649475098, 0.7889549732208252, 0.8532447814941406, 0.9175345301628113, 0.9818243384361267, 1.046114206314087, 1.1104038953781128, 1.1746937036514282, 1.2389835119247437, 1.303273320198059, 1.3675631284713745, 1.43185293674469, 1.4961426258087158, 1.5604324340820312, 1.6247222423553467, 1.689012050628662, 1.7533018589019775, 1.817591667175293, 1.8818814754486084, 1.9461712837219238, 2.0104610919952393, 2.0747509002685547, 2.13904070854187, 2.2033305168151855, 2.267620086669922, 2.3319098949432373, 2.3961997032165527, 2.460489511489868, 2.5247793197631836, 2.589069128036499, 2.6533589363098145, 2.717648506164551, 2.7819385528564453]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 6.0, 6.0, 13.0, 14.0, 20.0, 16.0, 23.0, 28.0, 30.0, 32.0, 49.0, 51.0, 47.0, 49.0, 66.0, 62.0, 60.0, 50.0, 60.0, 41.0, 37.0, 38.0, 43.0, 39.0, 28.0, 21.0, 17.0, 18.0, 13.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.6954822540283203, -1.6533327102661133, -1.6111831665039062, -1.5690336227416992, -1.5268839597702026, -1.4847344160079956, -1.4425848722457886, -1.4004353284835815, -1.358285665512085, -1.316136121749878, -1.273986577987671, -1.2318370342254639, -1.1896873712539673, -1.1475378274917603, -1.1053882837295532, -1.0632387399673462, -1.0210891962051392, -0.9789396524429321, -0.9367900490760803, -0.8946405053138733, -0.8524909019470215, -0.8103413581848145, -0.7681918144226074, -0.7260422706604004, -0.6838926672935486, -0.6417431235313416, -0.5995935201644897, -0.5574439764022827, -0.5152944326400757, -0.4731448292732239, -0.43099528551101685, -0.3888457119464874, -0.346696138381958, -0.3045465648174286, -0.26239699125289917, -0.22024744749069214, -0.17809787392616272, -0.1359483003616333, -0.09379875659942627, -0.05164918303489685, -0.009499609470367432, 0.03264995664358139, 0.07479952275753021, 0.11694908142089844, 0.15909865498542786, 0.20124822854995728, 0.2433977723121643, 0.2855473458766937, 0.32769691944122314, 0.36984649300575256, 0.411996066570282, 0.454145610332489, 0.49629518389701843, 0.5384447574615479, 0.5805943012237549, 0.6227438449859619, 0.6648934483528137, 0.7070429921150208, 0.7491925954818726, 0.7913421392440796, 0.8334916830062866, 0.8756412863731384, 0.9177908301353455, 0.9599404335021973, 1.0020899772644043]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 15.0, 23.0, 35.0, 42.0, 107.0, 151.0, 298.0, 597.0, 1639.0, 5855.0, 30378.0, 218258.0, 632949.0, 131852.0, 19857.0, 4093.0, 1249.0, 514.0, 276.0, 156.0, 70.0, 50.0, 28.0, 17.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3946685791015625, -0.383819580078125, -0.3729705810546875, -0.36212158203125, -0.3512725830078125, -0.340423583984375, -0.3295745849609375, -0.3187255859375, -0.3078765869140625, -0.297027587890625, -0.2861785888671875, -0.27532958984375, -0.2644805908203125, -0.253631591796875, -0.2427825927734375, -0.23193359375, -0.2210845947265625, -0.210235595703125, -0.1993865966796875, -0.18853759765625, -0.1776885986328125, -0.166839599609375, -0.1559906005859375, -0.1451416015625, -0.1342926025390625, -0.123443603515625, -0.1125946044921875, -0.10174560546875, -0.0908966064453125, -0.080047607421875, -0.0691986083984375, -0.058349609375, -0.0475006103515625, -0.036651611328125, -0.0258026123046875, -0.01495361328125, -0.0041046142578125, 0.006744384765625, 0.0175933837890625, 0.0284423828125, 0.0392913818359375, 0.050140380859375, 0.0609893798828125, 0.07183837890625, 0.0826873779296875, 0.093536376953125, 0.1043853759765625, 0.115234375, 0.1260833740234375, 0.136932373046875, 0.1477813720703125, 0.15863037109375, 0.1694793701171875, 0.180328369140625, 0.1911773681640625, 0.2020263671875, 0.2128753662109375, 0.223724365234375, 0.2345733642578125, 0.24542236328125, 0.2562713623046875, 0.267120361328125, 0.2779693603515625, 0.288818359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 10.0, 16.0, 16.0, 24.0, 36.0, 41.0, 56.0, 51.0, 64.0, 74.0, 77.0, 84.0, 63.0, 73.0, 69.0, 53.0, 32.0, 37.0, 32.0, 28.0, 25.0, 13.0, 3.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2481689453125, -0.2405071258544922, -0.23284530639648438, -0.22518348693847656, -0.21752166748046875, -0.20985984802246094, -0.20219802856445312, -0.1945362091064453, -0.1868743896484375, -0.1792125701904297, -0.17155075073242188, -0.16388893127441406, -0.15622711181640625, -0.14856529235839844, -0.14090347290039062, -0.1332416534423828, -0.125579833984375, -0.11791801452636719, -0.11025619506835938, -0.10259437561035156, -0.09493255615234375, -0.08727073669433594, -0.07960891723632812, -0.07194709777832031, -0.0642852783203125, -0.05662345886230469, -0.048961639404296875, -0.04129981994628906, -0.03363800048828125, -0.025976181030273438, -0.018314361572265625, -0.010652542114257812, -0.00299072265625, 0.0046710968017578125, 0.012332916259765625, 0.019994735717773438, 0.02765655517578125, 0.03531837463378906, 0.042980194091796875, 0.05064201354980469, 0.0583038330078125, 0.06596565246582031, 0.07362747192382812, 0.08128929138183594, 0.08895111083984375, 0.09661293029785156, 0.10427474975585938, 0.11193656921386719, 0.119598388671875, 0.1272602081298828, 0.13492202758789062, 0.14258384704589844, 0.15024566650390625, 0.15790748596191406, 0.16556930541992188, 0.1732311248779297, 0.1808929443359375, 0.1885547637939453, 0.19621658325195312, 0.20387840270996094, 0.21154022216796875, 0.21920204162597656, 0.22686386108398438, 0.2345256805419922, 0.2421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 13.0, 12.0, 27.0, 32.0, 40.0, 60.0, 73.0, 83.0, 139.0, 182.0, 260.0, 379.0, 664.0, 1171.0, 3018.0, 14622.0, 134781.0, 787043.0, 89598.0, 10775.0, 2605.0, 1056.0, 569.0, 407.0, 282.0, 166.0, 117.0, 82.0, 62.0, 68.0, 34.0, 27.0, 25.0, 17.0, 13.0, 9.0, 6.0, 3.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.415283203125, -0.40247344970703125, -0.3896636962890625, -0.37685394287109375, -0.364044189453125, -0.35123443603515625, -0.3384246826171875, -0.32561492919921875, -0.31280517578125, -0.29999542236328125, -0.2871856689453125, -0.27437591552734375, -0.261566162109375, -0.24875640869140625, -0.2359466552734375, -0.22313690185546875, -0.2103271484375, -0.19751739501953125, -0.1847076416015625, -0.17189788818359375, -0.159088134765625, -0.14627838134765625, -0.1334686279296875, -0.12065887451171875, -0.10784912109375, -0.09503936767578125, -0.0822296142578125, -0.06941986083984375, -0.056610107421875, -0.04380035400390625, -0.0309906005859375, -0.01818084716796875, -0.00537109375, 0.00743865966796875, 0.0202484130859375, 0.03305816650390625, 0.045867919921875, 0.05867767333984375, 0.0714874267578125, 0.08429718017578125, 0.09710693359375, 0.10991668701171875, 0.1227264404296875, 0.13553619384765625, 0.148345947265625, 0.16115570068359375, 0.1739654541015625, 0.18677520751953125, 0.1995849609375, 0.21239471435546875, 0.2252044677734375, 0.23801422119140625, 0.250823974609375, 0.26363372802734375, 0.2764434814453125, 0.28925323486328125, 0.30206298828125, 0.31487274169921875, 0.3276824951171875, 0.34049224853515625, 0.353302001953125, 0.36611175537109375, 0.3789215087890625, 0.39173126220703125, 0.404541015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 1.0, 3.0, 4.0, 15.0, 5.0, 12.0, 15.0, 15.0, 21.0, 41.0, 22.0, 39.0, 42.0, 57.0, 43.0, 58.0, 66.0, 67.0, 71.0, 63.0, 53.0, 41.0, 40.0, 36.0, 29.0, 35.0, 37.0, 16.0, 9.0, 7.0, 11.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.625, -0.6049728393554688, -0.5849456787109375, -0.5649185180664062, -0.544891357421875, -0.5248641967773438, -0.5048370361328125, -0.48480987548828125, -0.46478271484375, -0.44475555419921875, -0.4247283935546875, -0.40470123291015625, -0.384674072265625, -0.36464691162109375, -0.3446197509765625, -0.32459259033203125, -0.3045654296875, -0.28453826904296875, -0.2645111083984375, -0.24448394775390625, -0.224456787109375, -0.20442962646484375, -0.1844024658203125, -0.16437530517578125, -0.14434814453125, -0.12432098388671875, -0.1042938232421875, -0.08426666259765625, -0.064239501953125, -0.04421234130859375, -0.0241851806640625, -0.00415802001953125, 0.015869140625, 0.03589630126953125, 0.0559234619140625, 0.07595062255859375, 0.095977783203125, 0.11600494384765625, 0.1360321044921875, 0.15605926513671875, 0.17608642578125, 0.19611358642578125, 0.2161407470703125, 0.23616790771484375, 0.256195068359375, 0.27622222900390625, 0.2962493896484375, 0.31627655029296875, 0.3363037109375, 0.35633087158203125, 0.3763580322265625, 0.39638519287109375, 0.416412353515625, 0.43643951416015625, 0.4564666748046875, 0.47649383544921875, 0.49652099609375, 0.5165481567382812, 0.5365753173828125, 0.5566024780273438, 0.576629638671875, 0.5966567993164062, 0.6166839599609375, 0.6367111206054688, 0.65673828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 16.0, 28.0, 44.0, 62.0, 163.0, 287.0, 821.0, 2963.0, 16922.0, 191790.0, 786343.0, 41169.0, 5681.0, 1324.0, 463.0, 207.0, 98.0, 62.0, 30.0, 15.0, 15.0, 8.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.18938350677490234, -0.1845531463623047, -0.17972278594970703, -0.17489242553710938, -0.17006206512451172, -0.16523170471191406, -0.1604013442993164, -0.15557098388671875, -0.1507406234741211, -0.14591026306152344, -0.14107990264892578, -0.13624954223632812, -0.13141918182373047, -0.1265888214111328, -0.12175846099853516, -0.1169281005859375, -0.11209774017333984, -0.10726737976074219, -0.10243701934814453, -0.09760665893554688, -0.09277629852294922, -0.08794593811035156, -0.0831155776977539, -0.07828521728515625, -0.0734548568725586, -0.06862449645996094, -0.06379413604736328, -0.058963775634765625, -0.05413341522216797, -0.04930305480957031, -0.044472694396972656, -0.039642333984375, -0.034811973571777344, -0.029981613159179688, -0.02515125274658203, -0.020320892333984375, -0.015490531921386719, -0.010660171508789062, -0.005829811096191406, -0.00099945068359375, 0.0038309097290039062, 0.008661270141601562, 0.013491630554199219, 0.018321990966796875, 0.02315235137939453, 0.027982711791992188, 0.032813072204589844, 0.0376434326171875, 0.042473793029785156, 0.04730415344238281, 0.05213451385498047, 0.056964874267578125, 0.06179523468017578, 0.06662559509277344, 0.0714559555053711, 0.07628631591796875, 0.0811166763305664, 0.08594703674316406, 0.09077739715576172, 0.09560775756835938, 0.10043811798095703, 0.10526847839355469, 0.11009883880615234, 0.11492919921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 2.0, 14.0, 11.0, 13.0, 21.0, 23.0, 26.0, 61.0, 86.0, 95.0, 84.0, 115.0, 89.0, 68.0, 64.0, 48.0, 51.0, 23.0, 20.0, 19.0, 19.0, 7.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.235709249973297e-05, -5.083158612251282e-05, -4.9306079745292664e-05, -4.778057336807251e-05, -4.6255066990852356e-05, -4.47295606136322e-05, -4.320405423641205e-05, -4.1678547859191895e-05, -4.015304148197174e-05, -3.862753510475159e-05, -3.710202872753143e-05, -3.557652235031128e-05, -3.4051015973091125e-05, -3.252550959587097e-05, -3.100000321865082e-05, -2.9474496841430664e-05, -2.794899046421051e-05, -2.6423484086990356e-05, -2.4897977709770203e-05, -2.337247133255005e-05, -2.1846964955329895e-05, -2.032145857810974e-05, -1.8795952200889587e-05, -1.7270445823669434e-05, -1.574493944644928e-05, -1.4219433069229126e-05, -1.2693926692008972e-05, -1.1168420314788818e-05, -9.642913937568665e-06, -8.11740756034851e-06, -6.591901183128357e-06, -5.066394805908203e-06, -3.5408884286880493e-06, -2.0153820514678955e-06, -4.898756742477417e-07, 1.0356307029724121e-06, 2.561137080192566e-06, 4.08664345741272e-06, 5.6121498346328735e-06, 7.137656211853027e-06, 8.663162589073181e-06, 1.0188668966293335e-05, 1.1714175343513489e-05, 1.3239681720733643e-05, 1.4765188097953796e-05, 1.629069447517395e-05, 1.7816200852394104e-05, 1.9341707229614258e-05, 2.086721360683441e-05, 2.2392719984054565e-05, 2.391822636127472e-05, 2.5443732738494873e-05, 2.6969239115715027e-05, 2.849474549293518e-05, 3.0020251870155334e-05, 3.154575824737549e-05, 3.307126462459564e-05, 3.4596771001815796e-05, 3.612227737903595e-05, 3.7647783756256104e-05, 3.917329013347626e-05, 4.069879651069641e-05, 4.2224302887916565e-05, 4.374980926513672e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 11.0, 3.0, 3.0, 15.0, 9.0, 23.0, 24.0, 32.0, 43.0, 74.0, 105.0, 152.0, 214.0, 368.0, 639.0, 1365.0, 3134.0, 8486.0, 28872.0, 125412.0, 687716.0, 143615.0, 32135.0, 9405.0, 3405.0, 1445.0, 713.0, 379.0, 233.0, 155.0, 93.0, 70.0, 62.0, 38.0, 30.0, 22.0, 12.0, 11.0, 10.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836181640625, -0.08096694946289062, -0.07831573486328125, -0.07566452026367188, -0.0730133056640625, -0.07036209106445312, -0.06771087646484375, -0.06505966186523438, -0.062408447265625, -0.059757232666015625, -0.05710601806640625, -0.054454803466796875, -0.0518035888671875, -0.049152374267578125, -0.04650115966796875, -0.043849945068359375, -0.04119873046875, -0.038547515869140625, -0.03589630126953125, -0.033245086669921875, -0.0305938720703125, -0.027942657470703125, -0.02529144287109375, -0.022640228271484375, -0.019989013671875, -0.017337799072265625, -0.01468658447265625, -0.012035369873046875, -0.0093841552734375, -0.006732940673828125, -0.00408172607421875, -0.001430511474609375, 0.001220703125, 0.003871917724609375, 0.00652313232421875, 0.009174346923828125, 0.0118255615234375, 0.014476776123046875, 0.01712799072265625, 0.019779205322265625, 0.022430419921875, 0.025081634521484375, 0.02773284912109375, 0.030384063720703125, 0.0330352783203125, 0.035686492919921875, 0.03833770751953125, 0.040988922119140625, 0.04364013671875, 0.046291351318359375, 0.04894256591796875, 0.051593780517578125, 0.0542449951171875, 0.056896209716796875, 0.05954742431640625, 0.062198638916015625, 0.064849853515625, 0.06750106811523438, 0.07015228271484375, 0.07280349731445312, 0.0754547119140625, 0.07810592651367188, 0.08075714111328125, 0.08340835571289062, 0.0860595703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 11.0, 12.0, 19.0, 17.0, 21.0, 21.0, 43.0, 56.0, 77.0, 91.0, 100.0, 98.0, 98.0, 72.0, 49.0, 42.0, 40.0, 27.0, 25.0, 18.0, 8.0, 10.0, 3.0, 3.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.09019088745117188, -0.08718109130859375, -0.08417129516601562, -0.0811614990234375, -0.07815170288085938, -0.07514190673828125, -0.07213211059570312, -0.069122314453125, -0.06611251831054688, -0.06310272216796875, -0.060092926025390625, -0.0570831298828125, -0.054073333740234375, -0.05106353759765625, -0.048053741455078125, -0.0450439453125, -0.042034149169921875, -0.03902435302734375, -0.036014556884765625, -0.0330047607421875, -0.029994964599609375, -0.02698516845703125, -0.023975372314453125, -0.020965576171875, -0.017955780029296875, -0.01494598388671875, -0.011936187744140625, -0.0089263916015625, -0.005916595458984375, -0.00290679931640625, 0.000102996826171875, 0.00311279296875, 0.006122589111328125, 0.00913238525390625, 0.012142181396484375, 0.0151519775390625, 0.018161773681640625, 0.02117156982421875, 0.024181365966796875, 0.027191162109375, 0.030200958251953125, 0.03321075439453125, 0.036220550537109375, 0.0392303466796875, 0.042240142822265625, 0.04524993896484375, 0.048259735107421875, 0.05126953125, 0.054279327392578125, 0.05728912353515625, 0.060298919677734375, 0.0633087158203125, 0.06631851196289062, 0.06932830810546875, 0.07233810424804688, 0.075347900390625, 0.07835769653320312, 0.08136749267578125, 0.08437728881835938, 0.0873870849609375, 0.09039688110351562, 0.09340667724609375, 0.09641647338867188, 0.09942626953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 29.0, 133.0, 494.0, 239.0, 58.0, 15.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.761096477508545, -7.583735466003418, -7.406374931335449, -7.229013919830322, -7.051652908325195, -6.874292373657227, -6.6969313621521, -6.519570350646973, -6.342209815979004, -6.164848804473877, -5.987488269805908, -5.810127258300781, -5.6327667236328125, -5.4554057121276855, -5.278044700622559, -5.10068416595459, -4.923323154449463, -4.745962142944336, -4.568601608276367, -4.39124059677124, -4.213879585266113, -4.0365190505981445, -3.8591580390930176, -3.6817972660064697, -3.504436492919922, -3.327075719833374, -3.149714946746826, -2.972353935241699, -2.7949931621551514, -2.6176323890686035, -2.4402713775634766, -2.2629106044769287, -2.085550308227539, -1.9081895351409912, -1.7308286428451538, -1.5534677505493164, -1.3761069774627686, -1.1987462043762207, -1.0213853120803833, -0.8440244197845459, -0.666663646697998, -0.4893028140068054, -0.3119419813156128, -0.13458114862442017, 0.04277968406677246, 0.2201405167579651, 0.3975013494491577, 0.5748622417449951, 0.752223014831543, 0.9295838475227356, 1.1069446802139282, 1.2843055725097656, 1.4616663455963135, 1.6390271186828613, 1.8163880109786987, 1.9937489032745361, 2.171109676361084, 2.348470449447632, 2.5258312225341797, 2.7031922340393066, 2.8805530071258545, 3.0579137802124023, 3.2352747917175293, 3.412635564804077, 3.589996337890625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 3.0, 5.0, 5.0, 7.0, 10.0, 10.0, 14.0, 11.0, 18.0, 19.0, 13.0, 24.0, 31.0, 29.0, 32.0, 39.0, 52.0, 56.0, 99.0, 83.0, 72.0, 47.0, 34.0, 33.0, 29.0, 26.0, 24.0, 14.0, 23.0, 16.0, 16.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6487575769424438, -1.5938482284545898, -1.5389389991760254, -1.4840296506881714, -1.4291203022003174, -1.374211072921753, -1.319301724433899, -1.264392375946045, -1.2094831466674805, -1.1545737981796265, -1.099664568901062, -1.044755220413208, -0.9898459315299988, -0.9349366426467896, -0.8800272941589355, -0.8251180052757263, -0.7702087163925171, -0.7152994275093079, -0.6603901386260986, -0.6054807901382446, -0.5505715012550354, -0.49566221237182617, -0.44075289368629456, -0.38584357500076294, -0.3309342861175537, -0.2760249972343445, -0.22111567854881287, -0.16620637476444244, -0.11129707098007202, -0.05638778209686279, -0.0014784634113311768, 0.05343085527420044, 0.10834002494812012, 0.16324932873249054, 0.21815863251686096, 0.2730679512023926, 0.3279772400856018, 0.38288652896881104, 0.43779584765434265, 0.49270516633987427, 0.5476144552230835, 0.6025237441062927, 0.657433032989502, 0.712342381477356, 0.7672516703605652, 0.8221609592437744, 0.8770703077316284, 0.9319795966148376, 0.9868888854980469, 1.0417982339859009, 1.0967074632644653, 1.1516168117523193, 1.2065260410308838, 1.2614353895187378, 1.3163447380065918, 1.3712539672851562, 1.4261633157730103, 1.4810726642608643, 1.5359818935394287, 1.5908912420272827, 1.6458005905151367, 1.7007098197937012, 1.7556191682815552, 1.8105285167694092, 1.8654377460479736]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 2.0, 3.0, 10.0, 14.0, 14.0, 25.0, 39.0, 59.0, 104.0, 194.0, 464.0, 1032.0, 3548.0, 19709.0, 313356.0, 3271640.0, 550302.0, 26952.0, 4550.0, 1224.0, 463.0, 243.0, 122.0, 73.0, 35.0, 30.0, 26.0, 7.0, 13.0, 8.0, 6.0, 3.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.25140380859375, -0.2415771484375, -0.23175048828125, -0.221923828125, -0.21209716796875, -0.2022705078125, -0.19244384765625, -0.1826171875, -0.17279052734375, -0.1629638671875, -0.15313720703125, -0.143310546875, -0.13348388671875, -0.1236572265625, -0.11383056640625, -0.10400390625, -0.09417724609375, -0.0843505859375, -0.07452392578125, -0.064697265625, -0.05487060546875, -0.0450439453125, -0.03521728515625, -0.025390625, -0.01556396484375, -0.0057373046875, 0.00408935546875, 0.013916015625, 0.02374267578125, 0.0335693359375, 0.04339599609375, 0.05322265625, 0.06304931640625, 0.0728759765625, 0.08270263671875, 0.092529296875, 0.10235595703125, 0.1121826171875, 0.12200927734375, 0.1318359375, 0.14166259765625, 0.1514892578125, 0.16131591796875, 0.171142578125, 0.18096923828125, 0.1907958984375, 0.20062255859375, 0.21044921875, 0.22027587890625, 0.2301025390625, 0.23992919921875, 0.249755859375, 0.25958251953125, 0.2694091796875, 0.27923583984375, 0.2890625, 0.29888916015625, 0.3087158203125, 0.31854248046875, 0.328369140625, 0.33819580078125, 0.3480224609375, 0.35784912109375, 0.36767578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 7.0, 9.0, 14.0, 30.0, 30.0, 50.0, 62.0, 62.0, 66.0, 76.0, 89.0, 72.0, 61.0, 73.0, 81.0, 46.0, 42.0, 30.0, 29.0, 17.0, 19.0, 10.0, 8.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24883651733398438, -0.24108123779296875, -0.23332595825195312, -0.2255706787109375, -0.21781539916992188, -0.21006011962890625, -0.20230484008789062, -0.194549560546875, -0.18679428100585938, -0.17903900146484375, -0.17128372192382812, -0.1635284423828125, -0.15577316284179688, -0.14801788330078125, -0.14026260375976562, -0.13250732421875, -0.12475204467773438, -0.11699676513671875, -0.10924148559570312, -0.1014862060546875, -0.09373092651367188, -0.08597564697265625, -0.07822036743164062, -0.070465087890625, -0.06270980834960938, -0.05495452880859375, -0.047199249267578125, -0.0394439697265625, -0.031688690185546875, -0.02393341064453125, -0.016178131103515625, -0.0084228515625, -0.000667572021484375, 0.00708770751953125, 0.014842987060546875, 0.0225982666015625, 0.030353546142578125, 0.03810882568359375, 0.045864105224609375, 0.053619384765625, 0.061374664306640625, 0.06912994384765625, 0.07688522338867188, 0.0846405029296875, 0.09239578247070312, 0.10015106201171875, 0.10790634155273438, 0.11566162109375, 0.12341690063476562, 0.13117218017578125, 0.13892745971679688, 0.1466827392578125, 0.15443801879882812, 0.16219329833984375, 0.16994857788085938, 0.177703857421875, 0.18545913696289062, 0.19321441650390625, 0.20096969604492188, 0.2087249755859375, 0.21648025512695312, 0.22423553466796875, 0.23199081420898438, 0.23974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 12.0, 10.0, 20.0, 18.0, 41.0, 66.0, 110.0, 235.0, 479.0, 1212.0, 4839.0, 40969.0, 2280726.0, 1823874.0, 35341.0, 4308.0, 1067.0, 439.0, 207.0, 101.0, 74.0, 35.0, 33.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330810546875, -0.3189849853515625, -0.307159423828125, -0.2953338623046875, -0.28350830078125, -0.2716827392578125, -0.259857177734375, -0.2480316162109375, -0.2362060546875, -0.2243804931640625, -0.212554931640625, -0.2007293701171875, -0.18890380859375, -0.1770782470703125, -0.165252685546875, -0.1534271240234375, -0.1416015625, -0.1297760009765625, -0.117950439453125, -0.1061248779296875, -0.09429931640625, -0.0824737548828125, -0.070648193359375, -0.0588226318359375, -0.0469970703125, -0.0351715087890625, -0.023345947265625, -0.0115203857421875, 0.00030517578125, 0.0121307373046875, 0.023956298828125, 0.0357818603515625, 0.047607421875, 0.0594329833984375, 0.071258544921875, 0.0830841064453125, 0.09490966796875, 0.1067352294921875, 0.118560791015625, 0.1303863525390625, 0.1422119140625, 0.1540374755859375, 0.165863037109375, 0.1776885986328125, 0.18951416015625, 0.2013397216796875, 0.213165283203125, 0.2249908447265625, 0.23681640625, 0.2486419677734375, 0.260467529296875, 0.2722930908203125, 0.28411865234375, 0.2959442138671875, 0.307769775390625, 0.3195953369140625, 0.3314208984375, 0.3432464599609375, 0.355072021484375, 0.3668975830078125, 0.37872314453125, 0.3905487060546875, 0.402374267578125, 0.4141998291015625, 0.426025390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 4.0, 6.0, 18.0, 17.0, 25.0, 31.0, 42.0, 56.0, 72.0, 131.0, 239.0, 371.0, 460.0, 594.0, 543.0, 462.0, 342.0, 207.0, 150.0, 94.0, 54.0, 25.0, 29.0, 30.0, 22.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238525390625, -0.23054885864257812, -0.22257232666015625, -0.21459579467773438, -0.2066192626953125, -0.19864273071289062, -0.19066619873046875, -0.18268966674804688, -0.174713134765625, -0.16673660278320312, -0.15876007080078125, -0.15078353881835938, -0.1428070068359375, -0.13483047485351562, -0.12685394287109375, -0.11887741088867188, -0.11090087890625, -0.10292434692382812, -0.09494781494140625, -0.08697128295898438, -0.0789947509765625, -0.07101821899414062, -0.06304168701171875, -0.055065155029296875, -0.047088623046875, -0.039112091064453125, -0.03113555908203125, -0.023159027099609375, -0.0151824951171875, -0.007205963134765625, 0.00077056884765625, 0.008747100830078125, 0.0167236328125, 0.024700164794921875, 0.03267669677734375, 0.040653228759765625, 0.0486297607421875, 0.056606292724609375, 0.06458282470703125, 0.07255935668945312, 0.080535888671875, 0.08851242065429688, 0.09648895263671875, 0.10446548461914062, 0.1124420166015625, 0.12041854858398438, 0.12839508056640625, 0.13637161254882812, 0.14434814453125, 0.15232467651367188, 0.16030120849609375, 0.16827774047851562, 0.1762542724609375, 0.18423080444335938, 0.19220733642578125, 0.20018386840820312, 0.208160400390625, 0.21613693237304688, 0.22411346435546875, 0.23208999633789062, 0.2400665283203125, 0.24804306030273438, 0.25601959228515625, 0.2639961242675781, 0.27197265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 11.0, 12.0, 62.0, 142.0, 282.0, 255.0, 138.0, 63.0, 21.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2180449962615967, -3.0988314151763916, -2.9796178340911865, -2.8604042530059814, -2.7411906719207764, -2.6219770908355713, -2.502763271331787, -2.383549690246582, -2.264336109161377, -2.145122528076172, -2.025908946990967, -1.9066953659057617, -1.7874817848205566, -1.6682682037353516, -1.549054503440857, -1.4298409223556519, -1.3106274604797363, -1.1914138793945312, -1.0722002983093262, -0.9529866576194763, -0.8337730765342712, -0.7145594954490662, -0.5953458547592163, -0.47613227367401123, -0.35691869258880615, -0.23770509660243988, -0.11849150061607361, 0.0007221102714538574, 0.11993569135665894, 0.239149272441864, 0.35836291313171387, 0.47757649421691895, 0.5967898368835449, 0.71600341796875, 0.8352169990539551, 0.9544306397438049, 1.0736441612243652, 1.1928577423095703, 1.312071442604065, 1.43128502368927, 1.550498604774475, 1.6697121858596802, 1.7889257669448853, 1.9081394672393799, 2.027353048324585, 2.14656662940979, 2.265780210494995, 2.3849937915802, 2.5042073726654053, 2.6234209537506104, 2.7426345348358154, 2.8618481159210205, 2.9810616970062256, 3.1002752780914307, 3.219489097595215, 3.33870267868042, 3.457916259765625, 3.57712984085083, 3.696343421936035, 3.8155570030212402, 3.9347705841064453, 4.05398416519165, 4.1731977462768555, 4.2924113273620605, 4.411624908447266]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 10.0, 12.0, 8.0, 14.0, 19.0, 26.0, 21.0, 33.0, 44.0, 29.0, 46.0, 60.0, 54.0, 72.0, 73.0, 74.0, 63.0, 53.0, 36.0, 58.0, 27.0, 28.0, 26.0, 21.0, 17.0, 14.0, 12.0, 10.0, 9.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88785982131958, -1.8361716270446777, -1.784483551979065, -1.7327953577041626, -1.6811072826385498, -1.6294190883636475, -1.5777310132980347, -1.5260428190231323, -1.4743547439575195, -1.4226665496826172, -1.3709784746170044, -1.319290280342102, -1.2676022052764893, -1.215914011001587, -1.1642259359359741, -1.1125377416610718, -1.060849666595459, -1.0091614723205566, -0.9574733972549438, -0.9057852625846863, -0.8540971279144287, -0.8024089336395264, -0.7507208585739136, -0.6990326642990112, -0.6473444700241089, -0.5956563353538513, -0.5439682006835938, -0.4922800660133362, -0.4405919313430786, -0.38890376687049866, -0.3372156322002411, -0.2855274975299835, -0.23383939266204834, -0.18215125799179077, -0.1304631233215332, -0.07877497375011444, -0.027086839079856873, 0.02460131049156189, 0.07628944516181946, 0.12797757983207703, 0.1796657145023346, 0.23135384917259216, 0.28304198384284973, 0.3347301483154297, 0.38641828298568726, 0.4381064176559448, 0.4897945523262024, 0.54148268699646, 0.5931708216667175, 0.6448589563369751, 0.6965470910072327, 0.7482352256774902, 0.7999233603477478, 0.8516114950180054, 0.9032996892929077, 0.9549877643585205, 1.0066759586334229, 1.0583641529083252, 1.110052227973938, 1.1617404222488403, 1.2134284973144531, 1.2651166915893555, 1.3168047666549683, 1.3684929609298706, 1.4201810359954834]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 7.0, 24.0, 30.0, 32.0, 40.0, 92.0, 151.0, 241.0, 533.0, 1055.0, 2456.0, 6481.0, 22572.0, 115701.0, 600395.0, 242838.0, 39423.0, 10201.0, 3381.0, 1394.0, 684.0, 345.0, 181.0, 103.0, 76.0, 41.0, 26.0, 17.0, 8.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.41552734375, -0.4042015075683594, -0.39287567138671875, -0.3815498352050781, -0.3702239990234375, -0.3588981628417969, -0.34757232666015625, -0.3362464904785156, -0.324920654296875, -0.3135948181152344, -0.30226898193359375, -0.2909431457519531, -0.2796173095703125, -0.2682914733886719, -0.25696563720703125, -0.24563980102539062, -0.23431396484375, -0.22298812866210938, -0.21166229248046875, -0.20033645629882812, -0.1890106201171875, -0.17768478393554688, -0.16635894775390625, -0.15503311157226562, -0.143707275390625, -0.13238143920898438, -0.12105560302734375, -0.10972976684570312, -0.0984039306640625, -0.08707809448242188, -0.07575225830078125, -0.06442642211914062, -0.0531005859375, -0.041774749755859375, -0.03044891357421875, -0.019123077392578125, -0.0077972412109375, 0.003528594970703125, 0.01485443115234375, 0.026180267333984375, 0.037506103515625, 0.048831939697265625, 0.06015777587890625, 0.07148361206054688, 0.0828094482421875, 0.09413528442382812, 0.10546112060546875, 0.11678695678710938, 0.12811279296875, 0.13943862915039062, 0.15076446533203125, 0.16209030151367188, 0.1734161376953125, 0.18474197387695312, 0.19606781005859375, 0.20739364624023438, 0.218719482421875, 0.23004531860351562, 0.24137115478515625, 0.2526969909667969, 0.2640228271484375, 0.2753486633300781, 0.28667449951171875, 0.2980003356933594, 0.309326171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 6.0, 11.0, 12.0, 16.0, 29.0, 36.0, 53.0, 54.0, 77.0, 66.0, 80.0, 64.0, 80.0, 83.0, 73.0, 59.0, 54.0, 31.0, 42.0, 18.0, 8.0, 15.0, 10.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.248046875, -0.240234375, -0.232421875, -0.224609375, -0.216796875, -0.208984375, -0.201171875, -0.193359375, -0.185546875, -0.177734375, -0.169921875, -0.162109375, -0.154296875, -0.146484375, -0.138671875, -0.130859375, -0.123046875, -0.115234375, -0.107421875, -0.099609375, -0.091796875, -0.083984375, -0.076171875, -0.068359375, -0.060546875, -0.052734375, -0.044921875, -0.037109375, -0.029296875, -0.021484375, -0.013671875, -0.005859375, 0.001953125, 0.009765625, 0.017578125, 0.025390625, 0.033203125, 0.041015625, 0.048828125, 0.056640625, 0.064453125, 0.072265625, 0.080078125, 0.087890625, 0.095703125, 0.103515625, 0.111328125, 0.119140625, 0.126953125, 0.134765625, 0.142578125, 0.150390625, 0.158203125, 0.166015625, 0.173828125, 0.181640625, 0.189453125, 0.197265625, 0.205078125, 0.212890625, 0.220703125, 0.228515625, 0.236328125, 0.244140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 14.0, 14.0, 28.0, 39.0, 62.0, 79.0, 117.0, 191.0, 256.0, 452.0, 768.0, 1545.0, 4550.0, 50053.0, 928984.0, 53125.0, 4647.0, 1550.0, 750.0, 474.0, 266.0, 179.0, 123.0, 73.0, 62.0, 40.0, 30.0, 20.0, 10.0, 13.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6842727661132812, -0.6644439697265625, -0.6446151733398438, -0.624786376953125, -0.6049575805664062, -0.5851287841796875, -0.5652999877929688, -0.54547119140625, -0.5256423950195312, -0.5058135986328125, -0.48598480224609375, -0.466156005859375, -0.44632720947265625, -0.4264984130859375, -0.40666961669921875, -0.3868408203125, -0.36701202392578125, -0.3471832275390625, -0.32735443115234375, -0.307525634765625, -0.28769683837890625, -0.2678680419921875, -0.24803924560546875, -0.22821044921875, -0.20838165283203125, -0.1885528564453125, -0.16872406005859375, -0.148895263671875, -0.12906646728515625, -0.1092376708984375, -0.08940887451171875, -0.069580078125, -0.04975128173828125, -0.0299224853515625, -0.01009368896484375, 0.009735107421875, 0.02956390380859375, 0.0493927001953125, 0.06922149658203125, 0.08905029296875, 0.10887908935546875, 0.1287078857421875, 0.14853668212890625, 0.168365478515625, 0.18819427490234375, 0.2080230712890625, 0.22785186767578125, 0.2476806640625, 0.26750946044921875, 0.2873382568359375, 0.30716705322265625, 0.326995849609375, 0.34682464599609375, 0.3666534423828125, 0.38648223876953125, 0.40631103515625, 0.42613983154296875, 0.4459686279296875, 0.46579742431640625, 0.485626220703125, 0.5054550170898438, 0.5252838134765625, 0.5451126098632812, 0.56494140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 14.0, 14.0, 33.0, 32.0, 38.0, 46.0, 52.0, 57.0, 51.0, 71.0, 82.0, 70.0, 77.0, 52.0, 60.0, 35.0, 37.0, 35.0, 23.0, 22.0, 17.0, 13.0, 8.0, 8.0, 10.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5635757446289062, -0.5417022705078125, -0.5198287963867188, -0.497955322265625, -0.47608184814453125, -0.4542083740234375, -0.43233489990234375, -0.41046142578125, -0.38858795166015625, -0.3667144775390625, -0.34484100341796875, -0.322967529296875, -0.30109405517578125, -0.2792205810546875, -0.25734710693359375, -0.2354736328125, -0.21360015869140625, -0.1917266845703125, -0.16985321044921875, -0.147979736328125, -0.12610626220703125, -0.1042327880859375, -0.08235931396484375, -0.06048583984375, -0.03861236572265625, -0.0167388916015625, 0.00513458251953125, 0.027008056640625, 0.04888153076171875, 0.0707550048828125, 0.09262847900390625, 0.114501953125, 0.13637542724609375, 0.1582489013671875, 0.18012237548828125, 0.201995849609375, 0.22386932373046875, 0.2457427978515625, 0.26761627197265625, 0.28948974609375, 0.31136322021484375, 0.3332366943359375, 0.35511016845703125, 0.376983642578125, 0.39885711669921875, 0.4207305908203125, 0.44260406494140625, 0.4644775390625, 0.48635101318359375, 0.5082244873046875, 0.5300979614257812, 0.551971435546875, 0.5738449096679688, 0.5957183837890625, 0.6175918579101562, 0.63946533203125, 0.6613388061523438, 0.6832122802734375, 0.7050857543945312, 0.726959228515625, 0.7488327026367188, 0.7707061767578125, 0.7925796508789062, 0.814453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 5.0, 5.0, 2.0, 4.0, 12.0, 8.0, 6.0, 7.0, 19.0, 22.0, 26.0, 36.0, 66.0, 106.0, 156.0, 277.0, 630.0, 1945.0, 10421.0, 323096.0, 696171.0, 11843.0, 2168.0, 750.0, 301.0, 155.0, 80.0, 60.0, 52.0, 28.0, 19.0, 17.0, 7.0, 10.0, 7.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2138671875, -0.20718955993652344, -0.20051193237304688, -0.1938343048095703, -0.18715667724609375, -0.1804790496826172, -0.17380142211914062, -0.16712379455566406, -0.1604461669921875, -0.15376853942871094, -0.14709091186523438, -0.1404132843017578, -0.13373565673828125, -0.1270580291748047, -0.12038040161132812, -0.11370277404785156, -0.107025146484375, -0.10034751892089844, -0.09366989135742188, -0.08699226379394531, -0.08031463623046875, -0.07363700866699219, -0.06695938110351562, -0.06028175354003906, -0.0536041259765625, -0.04692649841308594, -0.040248870849609375, -0.03357124328613281, -0.02689361572265625, -0.020215988159179688, -0.013538360595703125, -0.0068607330322265625, -0.00018310546875, 0.0064945220947265625, 0.013172149658203125, 0.019849777221679688, 0.02652740478515625, 0.03320503234863281, 0.039882659912109375, 0.04656028747558594, 0.0532379150390625, 0.05991554260253906, 0.06659317016601562, 0.07327079772949219, 0.07994842529296875, 0.08662605285644531, 0.09330368041992188, 0.09998130798339844, 0.106658935546875, 0.11333656311035156, 0.12001419067382812, 0.1266918182373047, 0.13336944580078125, 0.1400470733642578, 0.14672470092773438, 0.15340232849121094, 0.1600799560546875, 0.16675758361816406, 0.17343521118164062, 0.1801128387451172, 0.18679046630859375, 0.1934680938720703, 0.20014572143554688, 0.20682334899902344, 0.2135009765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 13.0, 4.0, 7.0, 10.0, 9.0, 13.0, 19.0, 28.0, 28.0, 41.0, 70.0, 97.0, 121.0, 126.0, 101.0, 84.0, 60.0, 36.0, 22.0, 25.0, 14.0, 10.0, 14.0, 10.0, 7.0, 7.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.70823860168457e-05, -8.492451161146164e-05, -8.276663720607758e-05, -8.060876280069351e-05, -7.845088839530945e-05, -7.629301398992538e-05, -7.413513958454132e-05, -7.197726517915726e-05, -6.98193907737732e-05, -6.766151636838913e-05, -6.550364196300507e-05, -6.3345767557621e-05, -6.118789315223694e-05, -5.9030018746852875e-05, -5.687214434146881e-05, -5.471426993608475e-05, -5.2556395530700684e-05, -5.039852112531662e-05, -4.8240646719932556e-05, -4.608277231454849e-05, -4.392489790916443e-05, -4.1767023503780365e-05, -3.96091490983963e-05, -3.745127469301224e-05, -3.5293400287628174e-05, -3.313552588224411e-05, -3.0977651476860046e-05, -2.8819777071475983e-05, -2.666190266609192e-05, -2.4504028260707855e-05, -2.234615385532379e-05, -2.0188279449939728e-05, -1.8030405044555664e-05, -1.58725306391716e-05, -1.3714656233787537e-05, -1.1556781828403473e-05, -9.39890742301941e-06, -7.2410330176353455e-06, -5.083158612251282e-06, -2.925284206867218e-06, -7.674098014831543e-07, 1.3904646039009094e-06, 3.548339009284973e-06, 5.706213414669037e-06, 7.8640878200531e-06, 1.0021962225437164e-05, 1.2179836630821228e-05, 1.4337711036205292e-05, 1.6495585441589355e-05, 1.865345984697342e-05, 2.0811334252357483e-05, 2.2969208657741547e-05, 2.512708306312561e-05, 2.7284957468509674e-05, 2.9442831873893738e-05, 3.16007062792778e-05, 3.3758580684661865e-05, 3.591645509004593e-05, 3.807432949542999e-05, 4.0232203900814056e-05, 4.239007830619812e-05, 4.4547952711582184e-05, 4.670582711696625e-05, 4.886370152235031e-05, 5.1021575927734375e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 13.0, 26.0, 28.0, 32.0, 53.0, 69.0, 107.0, 212.0, 333.0, 766.0, 1861.0, 6638.0, 44071.0, 859691.0, 118687.0, 11114.0, 2738.0, 1017.0, 472.0, 211.0, 121.0, 75.0, 51.0, 19.0, 22.0, 13.0, 17.0, 15.0, 13.0, 16.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1497802734375, -0.14533233642578125, -0.1408843994140625, -0.13643646240234375, -0.131988525390625, -0.12754058837890625, -0.1230926513671875, -0.11864471435546875, -0.11419677734375, -0.10974884033203125, -0.1053009033203125, -0.10085296630859375, -0.096405029296875, -0.09195709228515625, -0.0875091552734375, -0.08306121826171875, -0.07861328125, -0.07416534423828125, -0.0697174072265625, -0.06526947021484375, -0.060821533203125, -0.05637359619140625, -0.0519256591796875, -0.04747772216796875, -0.04302978515625, -0.03858184814453125, -0.0341339111328125, -0.02968597412109375, -0.025238037109375, -0.02079010009765625, -0.0163421630859375, -0.01189422607421875, -0.0074462890625, -0.00299835205078125, 0.0014495849609375, 0.00589752197265625, 0.010345458984375, 0.01479339599609375, 0.0192413330078125, 0.02368927001953125, 0.02813720703125, 0.03258514404296875, 0.0370330810546875, 0.04148101806640625, 0.045928955078125, 0.05037689208984375, 0.0548248291015625, 0.05927276611328125, 0.063720703125, 0.06816864013671875, 0.0726165771484375, 0.07706451416015625, 0.081512451171875, 0.08596038818359375, 0.0904083251953125, 0.09485626220703125, 0.09930419921875, 0.10375213623046875, 0.1082000732421875, 0.11264801025390625, 0.117095947265625, 0.12154388427734375, 0.1259918212890625, 0.13043975830078125, 0.1348876953125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 17.0, 16.0, 27.0, 46.0, 58.0, 95.0, 131.0, 163.0, 116.0, 91.0, 77.0, 34.0, 32.0, 19.0, 7.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14802932739257812, -0.14395904541015625, -0.13988876342773438, -0.1358184814453125, -0.13174819946289062, -0.12767791748046875, -0.12360763549804688, -0.119537353515625, -0.11546707153320312, -0.11139678955078125, -0.10732650756835938, -0.1032562255859375, -0.09918594360351562, -0.09511566162109375, -0.09104537963867188, -0.08697509765625, -0.08290481567382812, -0.07883453369140625, -0.07476425170898438, -0.0706939697265625, -0.06662368774414062, -0.06255340576171875, -0.058483123779296875, -0.054412841796875, -0.050342559814453125, -0.04627227783203125, -0.042201995849609375, -0.0381317138671875, -0.034061431884765625, -0.02999114990234375, -0.025920867919921875, -0.0218505859375, -0.017780303955078125, -0.01371002197265625, -0.009639739990234375, -0.0055694580078125, -0.001499176025390625, 0.00257110595703125, 0.006641387939453125, 0.010711669921875, 0.014781951904296875, 0.01885223388671875, 0.022922515869140625, 0.0269927978515625, 0.031063079833984375, 0.03513336181640625, 0.039203643798828125, 0.04327392578125, 0.047344207763671875, 0.05141448974609375, 0.055484771728515625, 0.0595550537109375, 0.06362533569335938, 0.06769561767578125, 0.07176589965820312, 0.075836181640625, 0.07990646362304688, 0.08397674560546875, 0.08804702758789062, 0.0921173095703125, 0.09618759155273438, 0.10025787353515625, 0.10432815551757812, 0.1083984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 38.0, 269.0, 605.0, 54.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.463346481323242, -11.2151460647583, -10.96694564819336, -10.718745231628418, -10.470544815063477, -10.222344398498535, -9.974143981933594, -9.725943565368652, -9.477743148803711, -9.22954273223877, -8.981342315673828, -8.733141899108887, -8.484941482543945, -8.236741065979004, -7.9885406494140625, -7.740340232849121, -7.49213981628418, -7.243939399719238, -6.995738983154297, -6.7475385665893555, -6.499338150024414, -6.251137733459473, -6.002937316894531, -5.75473690032959, -5.50653600692749, -5.258335590362549, -5.010135173797607, -4.761934757232666, -4.513734340667725, -4.265533924102783, -4.017333507537842, -3.7691330909729004, -3.520932674407959, -3.2727322578430176, -3.024531841278076, -2.7763314247131348, -2.5281310081481934, -2.279930591583252, -2.0317301750183105, -1.7835296392440796, -1.5353292226791382, -1.2871288061141968, -1.0389283895492554, -0.7907279133796692, -0.5425274968147278, -0.2943270206451416, -0.046126604080200195, 0.2020738124847412, 0.4502742290496826, 0.698474645614624, 0.9466750621795654, 1.1948754787445068, 1.4430758953094482, 1.6912764310836792, 1.9394768476486206, 2.1876773834228516, 2.435877799987793, 2.6840782165527344, 2.932278633117676, 3.180479049682617, 3.4286794662475586, 3.6768798828125, 3.9250802993774414, 4.173280715942383, 4.421481132507324]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 10.0, 13.0, 7.0, 14.0, 13.0, 20.0, 22.0, 26.0, 28.0, 36.0, 51.0, 41.0, 90.0, 183.0, 104.0, 44.0, 45.0, 38.0, 30.0, 32.0, 28.0, 25.0, 15.0, 10.0, 18.0, 7.0, 10.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0799918174743652, -2.0016672611236572, -1.9233425855636597, -1.845017910003662, -1.766693353652954, -1.688368797302246, -1.6100441217422485, -1.531719446182251, -1.453394889831543, -1.375070333480835, -1.2967456579208374, -1.2184209823608398, -1.1400964260101318, -1.0617718696594238, -0.9834471940994263, -0.9051225781440735, -0.8267979621887207, -0.7484733462333679, -0.6701487302780151, -0.5918241143226624, -0.5134994983673096, -0.4351748824119568, -0.356850266456604, -0.2785256505012512, -0.20020103454589844, -0.12187641859054565, -0.04355180263519287, 0.03477281332015991, 0.1130974292755127, 0.19142204523086548, 0.26974666118621826, 0.34807127714157104, 0.4263956546783447, 0.5047202706336975, 0.5830448865890503, 0.6613695025444031, 0.7396941184997559, 0.8180187344551086, 0.8963433504104614, 0.9746679663658142, 1.052992582321167, 1.131317138671875, 1.2096418142318726, 1.2879664897918701, 1.3662910461425781, 1.4446156024932861, 1.5229402780532837, 1.6012649536132812, 1.6795895099639893, 1.7579140663146973, 1.8362387418746948, 1.9145634174346924, 1.9928879737854004, 2.0712125301361084, 2.1495370864868164, 2.2278618812561035, 2.3061864376068115, 2.3845109939575195, 2.4628357887268066, 2.5411603450775146, 2.6194849014282227, 2.6978094577789307, 2.7761340141296387, 2.854458808898926, 2.932783365249634]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 12.0, 11.0, 32.0, 30.0, 49.0, 86.0, 173.0, 290.0, 606.0, 1249.0, 3444.0, 12647.0, 87590.0, 1131623.0, 2569648.0, 346927.0, 29322.0, 6534.0, 2161.0, 895.0, 385.0, 215.0, 128.0, 69.0, 40.0, 30.0, 29.0, 13.0, 7.0, 3.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.269775390625, -0.25988006591796875, -0.2499847412109375, -0.24008941650390625, -0.230194091796875, -0.22029876708984375, -0.2104034423828125, -0.20050811767578125, -0.19061279296875, -0.18071746826171875, -0.1708221435546875, -0.16092681884765625, -0.151031494140625, -0.14113616943359375, -0.1312408447265625, -0.12134552001953125, -0.1114501953125, -0.10155487060546875, -0.0916595458984375, -0.08176422119140625, -0.071868896484375, -0.06197357177734375, -0.0520782470703125, -0.04218292236328125, -0.03228759765625, -0.02239227294921875, -0.0124969482421875, -0.00260162353515625, 0.007293701171875, 0.01718902587890625, 0.0270843505859375, 0.03697967529296875, 0.046875, 0.05677032470703125, 0.0666656494140625, 0.07656097412109375, 0.086456298828125, 0.09635162353515625, 0.1062469482421875, 0.11614227294921875, 0.12603759765625, 0.13593292236328125, 0.1458282470703125, 0.15572357177734375, 0.165618896484375, 0.17551422119140625, 0.1854095458984375, 0.19530487060546875, 0.2052001953125, 0.21509552001953125, 0.2249908447265625, 0.23488616943359375, 0.244781494140625, 0.25467681884765625, 0.2645721435546875, 0.27446746826171875, 0.28436279296875, 0.29425811767578125, 0.3041534423828125, 0.31404876708984375, 0.323944091796875, 0.33383941650390625, 0.3437347412109375, 0.35363006591796875, 0.363525390625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 15.0, 20.0, 31.0, 37.0, 52.0, 59.0, 74.0, 70.0, 70.0, 82.0, 88.0, 84.0, 72.0, 55.0, 38.0, 43.0, 22.0, 18.0, 9.0, 11.0, 12.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24914169311523438, -0.24144744873046875, -0.23375320434570312, -0.2260589599609375, -0.21836471557617188, -0.21067047119140625, -0.20297622680664062, -0.195281982421875, -0.18758773803710938, -0.17989349365234375, -0.17219924926757812, -0.1645050048828125, -0.15681076049804688, -0.14911651611328125, -0.14142227172851562, -0.13372802734375, -0.12603378295898438, -0.11833953857421875, -0.11064529418945312, -0.1029510498046875, -0.09525680541992188, -0.08756256103515625, -0.07986831665039062, -0.072174072265625, -0.06447982788085938, -0.05678558349609375, -0.049091339111328125, -0.0413970947265625, -0.033702850341796875, -0.02600860595703125, -0.018314361572265625, -0.0106201171875, -0.002925872802734375, 0.00476837158203125, 0.012462615966796875, 0.0201568603515625, 0.027851104736328125, 0.03554534912109375, 0.043239593505859375, 0.050933837890625, 0.058628082275390625, 0.06632232666015625, 0.07401657104492188, 0.0817108154296875, 0.08940505981445312, 0.09709930419921875, 0.10479354858398438, 0.11248779296875, 0.12018203735351562, 0.12787628173828125, 0.13557052612304688, 0.1432647705078125, 0.15095901489257812, 0.15865325927734375, 0.16634750366210938, 0.174041748046875, 0.18173599243164062, 0.18943023681640625, 0.19712448120117188, 0.2048187255859375, 0.21251296997070312, 0.22020721435546875, 0.22790145874023438, 0.235595703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 4.0, 5.0, 10.0, 7.0, 13.0, 29.0, 40.0, 53.0, 85.0, 150.0, 337.0, 796.0, 2110.0, 12138.0, 3662971.0, 503794.0, 8334.0, 1941.0, 703.0, 342.0, 162.0, 97.0, 52.0, 39.0, 22.0, 15.0, 13.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.0367279052734375, -1.003143310546875, -0.9695587158203125, -0.93597412109375, -0.9023895263671875, -0.868804931640625, -0.8352203369140625, -0.8016357421875, -0.7680511474609375, -0.734466552734375, -0.7008819580078125, -0.66729736328125, -0.6337127685546875, -0.600128173828125, -0.5665435791015625, -0.532958984375, -0.4993743896484375, -0.465789794921875, -0.4322052001953125, -0.39862060546875, -0.3650360107421875, -0.331451416015625, -0.2978668212890625, -0.2642822265625, -0.2306976318359375, -0.197113037109375, -0.1635284423828125, -0.12994384765625, -0.0963592529296875, -0.062774658203125, -0.0291900634765625, 0.00439453125, 0.0379791259765625, 0.071563720703125, 0.1051483154296875, 0.13873291015625, 0.1723175048828125, 0.205902099609375, 0.2394866943359375, 0.2730712890625, 0.3066558837890625, 0.340240478515625, 0.3738250732421875, 0.40740966796875, 0.4409942626953125, 0.474578857421875, 0.5081634521484375, 0.541748046875, 0.5753326416015625, 0.608917236328125, 0.6425018310546875, 0.67608642578125, 0.7096710205078125, 0.743255615234375, 0.7768402099609375, 0.8104248046875, 0.8440093994140625, 0.877593994140625, 0.9111785888671875, 0.94476318359375, 0.9783477783203125, 1.011932373046875, 1.0455169677734375, 1.0791015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 5.0, 12.0, 31.0, 68.0, 107.0, 193.0, 379.0, 755.0, 919.0, 674.0, 400.0, 198.0, 118.0, 70.0, 39.0, 30.0, 20.0, 18.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5830078125, -0.55908203125, -0.53515625, -0.51123046875, -0.4873046875, -0.46337890625, -0.439453125, -0.41552734375, -0.3916015625, -0.36767578125, -0.34375, -0.31982421875, -0.2958984375, -0.27197265625, -0.248046875, -0.22412109375, -0.2001953125, -0.17626953125, -0.15234375, -0.12841796875, -0.1044921875, -0.08056640625, -0.056640625, -0.03271484375, -0.0087890625, 0.01513671875, 0.0390625, 0.06298828125, 0.0869140625, 0.11083984375, 0.134765625, 0.15869140625, 0.1826171875, 0.20654296875, 0.23046875, 0.25439453125, 0.2783203125, 0.30224609375, 0.326171875, 0.35009765625, 0.3740234375, 0.39794921875, 0.421875, 0.44580078125, 0.4697265625, 0.49365234375, 0.517578125, 0.54150390625, 0.5654296875, 0.58935546875, 0.61328125, 0.63720703125, 0.6611328125, 0.68505859375, 0.708984375, 0.73291015625, 0.7568359375, 0.78076171875, 0.8046875, 0.82861328125, 0.8525390625, 0.87646484375, 0.900390625, 0.92431640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 19.0, 41.0, 184.0, 400.0, 207.0, 71.0, 27.0, 14.0, 9.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7272138595581055, -3.363909959793091, -3.000606060028076, -2.6373021602630615, -2.273998260498047, -1.9106943607330322, -1.5473904609680176, -1.184086561203003, -0.8207826614379883, -0.45747876167297363, -0.09417486190795898, 0.26912903785705566, 0.6324329376220703, 0.995736837387085, 1.3590407371520996, 1.7223446369171143, 2.085648536682129, 2.4489524364471436, 2.812256336212158, 3.175560235977173, 3.5388641357421875, 3.902168035507202, 4.265471935272217, 4.628775596618652, 4.992079734802246, 5.35538387298584, 5.718687534332275, 6.081991195678711, 6.445295333862305, 6.808599472045898, 7.171903133392334, 7.5352067947387695, 7.898509979248047, 8.26181411743164, 8.625118255615234, 8.988421440124512, 9.351725578308105, 9.7150297164917, 10.078332901000977, 10.44163703918457, 10.804941177368164, 11.168245315551758, 11.531549453735352, 11.894852638244629, 12.258156776428223, 12.621460914611816, 12.984764099121094, 13.348068237304688, 13.711372375488281, 14.074676513671875, 14.437980651855469, 14.801283836364746, 15.16458797454834, 15.527892112731934, 15.891195297241211, 16.254499435424805, 16.6178035736084, 16.981107711791992, 17.344411849975586, 17.70771598815918, 18.07101821899414, 18.434322357177734, 18.797626495361328, 19.160930633544922, 19.524234771728516]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 1.0, 2.0, 7.0, 6.0, 12.0, 10.0, 14.0, 24.0, 42.0, 40.0, 41.0, 62.0, 53.0, 85.0, 85.0, 89.0, 100.0, 71.0, 49.0, 48.0, 39.0, 32.0, 18.0, 12.0, 16.0, 15.0, 8.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.228280067443848, -4.069037437438965, -3.909795045852661, -3.7505526542663574, -3.5913100242614746, -3.432067394256592, -3.272825002670288, -3.1135826110839844, -2.9543399810791016, -2.7950973510742188, -2.635854959487915, -2.4766125679016113, -2.3173699378967285, -2.1581273078918457, -1.998884916305542, -1.8396424055099487, -1.6803998947143555, -1.5211573839187622, -1.361914873123169, -1.2026723623275757, -1.0434298515319824, -0.8841873407363892, -0.7249448299407959, -0.5657023191452026, -0.4064598083496094, -0.2472172975540161, -0.08797478675842285, 0.07126772403717041, 0.23051023483276367, 0.38975274562835693, 0.5489952564239502, 0.7082377672195435, 0.8674802780151367, 1.02672278881073, 1.1859652996063232, 1.3452078104019165, 1.5044503211975098, 1.663692831993103, 1.8229353427886963, 1.9821778535842896, 2.141420364379883, 2.3006629943847656, 2.4599053859710693, 2.619147777557373, 2.778390407562256, 2.9376330375671387, 3.0968754291534424, 3.256117820739746, 3.415360450744629, 3.5746030807495117, 3.7338454723358154, 3.893087863922119, 4.052330493927002, 4.211573123931885, 4.370815277099609, 4.530057907104492, 4.689300537109375, 4.848543167114258, 5.007785797119141, 5.167027950286865, 5.326270580291748, 5.485513210296631, 5.6447553634643555, 5.803997993469238, 5.963240623474121]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 7.0, 16.0, 24.0, 52.0, 71.0, 91.0, 181.0, 292.0, 603.0, 1397.0, 3445.0, 9769.0, 38503.0, 286642.0, 623168.0, 62477.0, 13858.0, 4615.0, 1715.0, 731.0, 375.0, 176.0, 109.0, 87.0, 40.0, 25.0, 22.0, 12.0, 9.0, 4.0, 12.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3310546875, -0.3207550048828125, -0.310455322265625, -0.3001556396484375, -0.28985595703125, -0.2795562744140625, -0.269256591796875, -0.2589569091796875, -0.2486572265625, -0.2383575439453125, -0.228057861328125, -0.2177581787109375, -0.20745849609375, -0.1971588134765625, -0.186859130859375, -0.1765594482421875, -0.166259765625, -0.1559600830078125, -0.145660400390625, -0.1353607177734375, -0.12506103515625, -0.1147613525390625, -0.104461669921875, -0.0941619873046875, -0.0838623046875, -0.0735626220703125, -0.063262939453125, -0.0529632568359375, -0.04266357421875, -0.0323638916015625, -0.022064208984375, -0.0117645263671875, -0.00146484375, 0.0088348388671875, 0.019134521484375, 0.0294342041015625, 0.03973388671875, 0.0500335693359375, 0.060333251953125, 0.0706329345703125, 0.0809326171875, 0.0912322998046875, 0.101531982421875, 0.1118316650390625, 0.12213134765625, 0.1324310302734375, 0.142730712890625, 0.1530303955078125, 0.163330078125, 0.1736297607421875, 0.183929443359375, 0.1942291259765625, 0.20452880859375, 0.2148284912109375, 0.225128173828125, 0.2354278564453125, 0.2457275390625, 0.2560272216796875, 0.266326904296875, 0.2766265869140625, 0.28692626953125, 0.2972259521484375, 0.307525634765625, 0.3178253173828125, 0.328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 13.0, 24.0, 32.0, 35.0, 57.0, 63.0, 82.0, 76.0, 92.0, 87.0, 83.0, 68.0, 71.0, 45.0, 52.0, 43.0, 20.0, 12.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.24055862426757812, -0.22965240478515625, -0.21874618530273438, -0.2078399658203125, -0.19693374633789062, -0.18602752685546875, -0.17512130737304688, -0.164215087890625, -0.15330886840820312, -0.14240264892578125, -0.13149642944335938, -0.1205902099609375, -0.10968399047851562, -0.09877777099609375, -0.08787155151367188, -0.07696533203125, -0.06605911254882812, -0.05515289306640625, -0.044246673583984375, -0.0333404541015625, -0.022434234619140625, -0.01152801513671875, -0.000621795654296875, 0.010284423828125, 0.021190643310546875, 0.03209686279296875, 0.043003082275390625, 0.0539093017578125, 0.06481552124023438, 0.07572174072265625, 0.08662796020507812, 0.0975341796875, 0.10844039916992188, 0.11934661865234375, 0.13025283813476562, 0.1411590576171875, 0.15206527709960938, 0.16297149658203125, 0.17387771606445312, 0.184783935546875, 0.19569015502929688, 0.20659637451171875, 0.21750259399414062, 0.2284088134765625, 0.23931503295898438, 0.25022125244140625, 0.2611274719238281, 0.27203369140625, 0.2829399108886719, 0.29384613037109375, 0.3047523498535156, 0.3156585693359375, 0.3265647888183594, 0.33747100830078125, 0.3483772277832031, 0.359283447265625, 0.3701896667480469, 0.38109588623046875, 0.3920021057128906, 0.4029083251953125, 0.4138145446777344, 0.42472076416015625, 0.4356269836425781, 0.446533203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 5.0, 9.0, 21.0, 30.0, 40.0, 59.0, 66.0, 112.0, 158.0, 324.0, 586.0, 1390.0, 5097.0, 48773.0, 943722.0, 40878.0, 4572.0, 1323.0, 521.0, 326.0, 174.0, 117.0, 67.0, 54.0, 45.0, 19.0, 10.0, 10.0, 9.0, 7.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.428955078125, -0.4153251647949219, -0.40169525146484375, -0.3880653381347656, -0.3744354248046875, -0.3608055114746094, -0.34717559814453125, -0.3335456848144531, -0.319915771484375, -0.3062858581542969, -0.29265594482421875, -0.2790260314941406, -0.2653961181640625, -0.2517662048339844, -0.23813629150390625, -0.22450637817382812, -0.21087646484375, -0.19724655151367188, -0.18361663818359375, -0.16998672485351562, -0.1563568115234375, -0.14272689819335938, -0.12909698486328125, -0.11546707153320312, -0.101837158203125, -0.08820724487304688, -0.07457733154296875, -0.060947418212890625, -0.0473175048828125, -0.033687591552734375, -0.02005767822265625, -0.006427764892578125, 0.0072021484375, 0.020832061767578125, 0.03446197509765625, 0.048091888427734375, 0.0617218017578125, 0.07535171508789062, 0.08898162841796875, 0.10261154174804688, 0.116241455078125, 0.12987136840820312, 0.14350128173828125, 0.15713119506835938, 0.1707611083984375, 0.18439102172851562, 0.19802093505859375, 0.21165084838867188, 0.22528076171875, 0.23891067504882812, 0.25254058837890625, 0.2661705017089844, 0.2798004150390625, 0.2934303283691406, 0.30706024169921875, 0.3206901550292969, 0.334320068359375, 0.3479499816894531, 0.36157989501953125, 0.3752098083496094, 0.3888397216796875, 0.4024696350097656, 0.41609954833984375, 0.4297294616699219, 0.443359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 6.0, 7.0, 4.0, 8.0, 5.0, 10.0, 10.0, 2.0, 18.0, 16.0, 24.0, 30.0, 39.0, 42.0, 56.0, 52.0, 76.0, 67.0, 83.0, 57.0, 65.0, 47.0, 42.0, 39.0, 27.0, 22.0, 16.0, 16.0, 19.0, 17.0, 9.0, 13.0, 9.0, 6.0, 3.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.72265625, -0.7010116577148438, -0.6793670654296875, -0.6577224731445312, -0.636077880859375, -0.6144332885742188, -0.5927886962890625, -0.5711441040039062, -0.54949951171875, -0.5278549194335938, -0.5062103271484375, -0.48456573486328125, -0.462921142578125, -0.44127655029296875, -0.4196319580078125, -0.39798736572265625, -0.3763427734375, -0.35469818115234375, -0.3330535888671875, -0.31140899658203125, -0.289764404296875, -0.26811981201171875, -0.2464752197265625, -0.22483062744140625, -0.20318603515625, -0.18154144287109375, -0.1598968505859375, -0.13825225830078125, -0.116607666015625, -0.09496307373046875, -0.0733184814453125, -0.05167388916015625, -0.030029296875, -0.00838470458984375, 0.0132598876953125, 0.03490447998046875, 0.056549072265625, 0.07819366455078125, 0.0998382568359375, 0.12148284912109375, 0.14312744140625, 0.16477203369140625, 0.1864166259765625, 0.20806121826171875, 0.229705810546875, 0.25135040283203125, 0.2729949951171875, 0.29463958740234375, 0.3162841796875, 0.33792877197265625, 0.3595733642578125, 0.38121795654296875, 0.402862548828125, 0.42450714111328125, 0.4461517333984375, 0.46779632568359375, 0.48944091796875, 0.5110855102539062, 0.5327301025390625, 0.5543746948242188, 0.576019287109375, 0.5976638793945312, 0.6193084716796875, 0.6409530639648438, 0.66259765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 11.0, 10.0, 15.0, 28.0, 18.0, 30.0, 51.0, 79.0, 104.0, 168.0, 248.0, 429.0, 872.0, 1800.0, 4956.0, 19461.0, 212000.0, 773846.0, 24317.0, 5807.0, 2042.0, 966.0, 479.0, 240.0, 159.0, 120.0, 78.0, 46.0, 52.0, 29.0, 23.0, 13.0, 10.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05438232421875, -0.05257368087768555, -0.050765037536621094, -0.04895639419555664, -0.04714775085449219, -0.045339107513427734, -0.04353046417236328, -0.04172182083129883, -0.039913177490234375, -0.03810453414916992, -0.03629589080810547, -0.034487247467041016, -0.03267860412597656, -0.03086996078491211, -0.029061317443847656, -0.027252674102783203, -0.02544403076171875, -0.023635387420654297, -0.021826744079589844, -0.02001810073852539, -0.018209457397460938, -0.016400814056396484, -0.014592170715332031, -0.012783527374267578, -0.010974884033203125, -0.009166240692138672, -0.007357597351074219, -0.005548954010009766, -0.0037403106689453125, -0.0019316673278808594, -0.00012302398681640625, 0.0016856193542480469, 0.0034942626953125, 0.005302906036376953, 0.007111549377441406, 0.00892019271850586, 0.010728836059570312, 0.012537479400634766, 0.014346122741699219, 0.016154766082763672, 0.017963409423828125, 0.019772052764892578, 0.02158069610595703, 0.023389339447021484, 0.025197982788085938, 0.02700662612915039, 0.028815269470214844, 0.030623912811279297, 0.03243255615234375, 0.0342411994934082, 0.036049842834472656, 0.03785848617553711, 0.03966712951660156, 0.041475772857666016, 0.04328441619873047, 0.04509305953979492, 0.046901702880859375, 0.04871034622192383, 0.05051898956298828, 0.052327632904052734, 0.05413627624511719, 0.05594491958618164, 0.057753562927246094, 0.05956220626831055, 0.061370849609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 7.0, 3.0, 10.0, 16.0, 24.0, 26.0, 51.0, 49.0, 57.0, 80.0, 84.0, 93.0, 92.0, 86.0, 67.0, 56.0, 33.0, 35.0, 28.0, 13.0, 16.0, 16.0, 6.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4809112548828125e-05, -3.34596261382103e-05, -3.211013972759247e-05, -3.076065331697464e-05, -2.941116690635681e-05, -2.8061680495738983e-05, -2.6712194085121155e-05, -2.5362707674503326e-05, -2.4013221263885498e-05, -2.266373485326767e-05, -2.131424844264984e-05, -1.9964762032032013e-05, -1.8615275621414185e-05, -1.7265789210796356e-05, -1.5916302800178528e-05, -1.45668163895607e-05, -1.3217329978942871e-05, -1.1867843568325043e-05, -1.0518357157707214e-05, -9.168870747089386e-06, -7.819384336471558e-06, -6.469897925853729e-06, -5.120411515235901e-06, -3.7709251046180725e-06, -2.421438694000244e-06, -1.0719522833824158e-06, 2.775341272354126e-07, 1.627020537853241e-06, 2.9765069484710693e-06, 4.325993359088898e-06, 5.675479769706726e-06, 7.0249661803245544e-06, 8.374452590942383e-06, 9.723939001560211e-06, 1.107342541217804e-05, 1.2422911822795868e-05, 1.3772398233413696e-05, 1.5121884644031525e-05, 1.6471371054649353e-05, 1.782085746526718e-05, 1.917034387588501e-05, 2.0519830286502838e-05, 2.1869316697120667e-05, 2.3218803107738495e-05, 2.4568289518356323e-05, 2.591777592897415e-05, 2.726726233959198e-05, 2.861674875020981e-05, 2.9966235160827637e-05, 3.1315721571445465e-05, 3.2665207982063293e-05, 3.401469439268112e-05, 3.536418080329895e-05, 3.671366721391678e-05, 3.806315362453461e-05, 3.9412640035152435e-05, 4.0762126445770264e-05, 4.211161285638809e-05, 4.346109926700592e-05, 4.481058567762375e-05, 4.616007208824158e-05, 4.7509558498859406e-05, 4.8859044909477234e-05, 5.020853132009506e-05, 5.155801773071289e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 7.0, 5.0, 7.0, 12.0, 13.0, 19.0, 24.0, 29.0, 39.0, 58.0, 79.0, 141.0, 153.0, 274.0, 447.0, 740.0, 1268.0, 2408.0, 4994.0, 10902.0, 28721.0, 120816.0, 773195.0, 67366.0, 20038.0, 8184.0, 3890.0, 1934.0, 1082.0, 601.0, 353.0, 240.0, 163.0, 96.0, 73.0, 48.0, 33.0, 28.0, 13.0, 16.0, 11.0, 18.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0308990478515625, -0.029880285263061523, -0.028861522674560547, -0.02784276008605957, -0.026823997497558594, -0.025805234909057617, -0.02478647232055664, -0.023767709732055664, -0.022748947143554688, -0.02173018455505371, -0.020711421966552734, -0.019692659378051758, -0.01867389678955078, -0.017655134201049805, -0.016636371612548828, -0.015617609024047852, -0.014598846435546875, -0.013580083847045898, -0.012561321258544922, -0.011542558670043945, -0.010523796081542969, -0.009505033493041992, -0.008486270904541016, -0.007467508316040039, -0.0064487457275390625, -0.005429983139038086, -0.004411220550537109, -0.003392457962036133, -0.0023736953735351562, -0.0013549327850341797, -0.0003361701965332031, 0.0006825923919677734, 0.00170135498046875, 0.0027201175689697266, 0.003738880157470703, 0.00475764274597168, 0.005776405334472656, 0.006795167922973633, 0.00781393051147461, 0.008832693099975586, 0.009851455688476562, 0.010870218276977539, 0.011888980865478516, 0.012907743453979492, 0.013926506042480469, 0.014945268630981445, 0.015964031219482422, 0.0169827938079834, 0.018001556396484375, 0.01902031898498535, 0.020039081573486328, 0.021057844161987305, 0.02207660675048828, 0.023095369338989258, 0.024114131927490234, 0.02513289451599121, 0.026151657104492188, 0.027170419692993164, 0.02818918228149414, 0.029207944869995117, 0.030226707458496094, 0.03124547004699707, 0.03226423263549805, 0.03328299522399902, 0.0343017578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 3.0, 3.0, 5.0, 10.0, 10.0, 9.0, 14.0, 12.0, 28.0, 32.0, 43.0, 79.0, 133.0, 171.0, 136.0, 96.0, 60.0, 46.0, 27.0, 11.0, 14.0, 13.0, 7.0, 8.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06182575225830078, -0.05980873107910156, -0.057791709899902344, -0.055774688720703125, -0.053757667541503906, -0.05174064636230469, -0.04972362518310547, -0.04770660400390625, -0.04568958282470703, -0.04367256164550781, -0.041655540466308594, -0.039638519287109375, -0.037621498107910156, -0.03560447692871094, -0.03358745574951172, -0.0315704345703125, -0.02955341339111328, -0.027536392211914062, -0.025519371032714844, -0.023502349853515625, -0.021485328674316406, -0.019468307495117188, -0.01745128631591797, -0.01543426513671875, -0.013417243957519531, -0.011400222778320312, -0.009383201599121094, -0.007366180419921875, -0.005349159240722656, -0.0033321380615234375, -0.0013151168823242188, 0.000701904296875, 0.0027189254760742188, 0.0047359466552734375, 0.006752967834472656, 0.008769989013671875, 0.010787010192871094, 0.012804031372070312, 0.014821052551269531, 0.01683807373046875, 0.01885509490966797, 0.020872116088867188, 0.022889137268066406, 0.024906158447265625, 0.026923179626464844, 0.028940200805664062, 0.03095722198486328, 0.0329742431640625, 0.03499126434326172, 0.03700828552246094, 0.039025306701660156, 0.041042327880859375, 0.043059349060058594, 0.04507637023925781, 0.04709339141845703, 0.04911041259765625, 0.05112743377685547, 0.05314445495605469, 0.055161476135253906, 0.057178497314453125, 0.059195518493652344, 0.06121253967285156, 0.06322956085205078, 0.06524658203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 13.0, 28.0, 39.0, 62.0, 156.0, 540.0, 77.0, 38.0, 16.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0018630027771, -4.896159648895264, -4.790456295013428, -4.684752464294434, -4.579049110412598, -4.473345756530762, -4.367642402648926, -4.26193904876709, -4.156235694885254, -4.050532341003418, -3.944828748703003, -3.839125394821167, -3.733421802520752, -3.627718448638916, -3.52201509475708, -3.416311740875244, -3.31060791015625, -3.204904556274414, -3.099200963973999, -2.993497610092163, -2.887794017791748, -2.782090663909912, -2.676387310028076, -2.5706839561462402, -2.464980363845825, -2.3592770099639893, -2.253573417663574, -2.1478700637817383, -2.0421667098999023, -1.9364631175994873, -1.8307597637176514, -1.7250562906265259, -1.6193530559539795, -1.513649582862854, -1.4079461097717285, -1.3022427558898926, -1.196539282798767, -1.0908358097076416, -0.9851323962211609, -0.8794289827346802, -0.7737255096435547, -0.6680220365524292, -0.5623186230659485, -0.4566151797771454, -0.3509117364883423, -0.2452082633972168, -0.13950484991073608, -0.03380143642425537, 0.07190203666687012, 0.17760547995567322, 0.2833089232444763, 0.3890123665332794, 0.4947158098220825, 0.600419282913208, 0.7061226963996887, 0.8118261098861694, 0.9175295829772949, 1.0232330560684204, 1.128936529159546, 1.2346398830413818, 1.3403433561325073, 1.4460468292236328, 1.5517501831054688, 1.6574536561965942, 1.7631571292877197]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 10.0, 7.0, 13.0, 11.0, 20.0, 14.0, 16.0, 19.0, 23.0, 33.0, 26.0, 37.0, 89.0, 324.0, 104.0, 26.0, 18.0, 21.0, 26.0, 23.0, 26.0, 23.0, 23.0, 8.0, 11.0, 6.0, 6.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5587775707244873, -2.4887776374816895, -2.4187777042388916, -2.3487777709960938, -2.278778076171875, -2.208778142929077, -2.1387782096862793, -2.0687782764434814, -1.9987783432006836, -1.9287784099578857, -1.858778476715088, -1.7887786626815796, -1.7187787294387817, -1.6487787961959839, -1.5787789821624756, -1.5087790489196777, -1.4387791156768799, -1.368779182434082, -1.2987792491912842, -1.2287794351577759, -1.158779501914978, -1.0887795686721802, -1.0187797546386719, -0.948779821395874, -0.8787798881530762, -0.8087799549102783, -0.7387800812721252, -0.6687802076339722, -0.5987802743911743, -0.5287803411483765, -0.4587804675102234, -0.3887805640697479, -0.31878089904785156, -0.2487809956073761, -0.17878109216690063, -0.10878118872642517, -0.03878128528594971, 0.031218618154525757, 0.10121852159500122, 0.17121842503547668, 0.24121832847595215, 0.3112182319164276, 0.3812181353569031, 0.45121803879737854, 0.521217942237854, 0.5912178754806519, 0.6612177491188049, 0.731217622756958, 0.8012175559997559, 0.8712174892425537, 0.9412173628807068, 1.0112172365188599, 1.0812171697616577, 1.1512171030044556, 1.2212169170379639, 1.2912168502807617, 1.3612167835235596, 1.4312167167663574, 1.5012166500091553, 1.5712164640426636, 1.6412163972854614, 1.7112163305282593, 1.7812161445617676, 1.8512160778045654, 1.9212160110473633]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 16.0, 22.0, 34.0, 37.0, 48.0, 70.0, 211.0, 260.0, 69.0, 59.0, 41.0, 33.0, 24.0, 23.0, 10.0, 9.0, 5.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2168598175048828, -0.20654678344726562, -0.19623374938964844, -0.18592071533203125, -0.17560768127441406, -0.16529464721679688, -0.1549816131591797, -0.1446685791015625, -0.1343555450439453, -0.12404251098632812, -0.11372947692871094, -0.10341644287109375, -0.09310340881347656, -0.08279037475585938, -0.07247734069824219, -0.062164306640625, -0.05185127258300781, -0.041538238525390625, -0.031225204467773438, -0.02091217041015625, -0.010599136352539062, -0.000286102294921875, 0.010026931762695312, 0.0203399658203125, 0.030652999877929688, 0.040966033935546875, 0.05127906799316406, 0.06159210205078125, 0.07190513610839844, 0.08221817016601562, 0.09253120422363281, 0.10284423828125, 0.11315727233886719, 0.12347030639648438, 0.13378334045410156, 0.14409637451171875, 0.15440940856933594, 0.16472244262695312, 0.1750354766845703, 0.1853485107421875, 0.1956615447998047, 0.20597457885742188, 0.21628761291503906, 0.22660064697265625, 0.23691368103027344, 0.24722671508789062, 0.2575397491455078, 0.267852783203125, 0.2781658172607422, 0.2884788513183594, 0.29879188537597656, 0.30910491943359375, 0.31941795349121094, 0.3297309875488281, 0.3400440216064453, 0.3503570556640625, 0.3606700897216797, 0.3709831237792969, 0.38129615783691406, 0.39160919189453125, 0.40192222595214844, 0.4122352600097656, 0.4225482940673828, 0.432861328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 11.0, 10.0, 5.0, 16.0, 14.0, 20.0, 33.0, 24.0, 62.0, 171.0, 443.0, 2900.0, 8365785.0, 17554.0, 986.0, 260.0, 105.0, 52.0, 9.0, 10.0, 40.0, 14.0, 5.0, 18.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 5.0], "bins": [-3.53940749168396, -3.42431902885437, -3.3092308044433594, -3.1941423416137695, -3.079054117202759, -2.963965654373169, -2.848877429962158, -2.7337889671325684, -2.6187005043029785, -2.5036120414733887, -2.388523817062378, -2.273435354232788, -2.1583471298217773, -2.0432586669921875, -1.9281703233718872, -1.813081979751587, -1.6979937553405762, -1.5829054117202759, -1.4678170680999756, -1.3527286052703857, -1.237640380859375, -1.1225519180297852, -1.0074635744094849, -0.8923752307891846, -0.7772868871688843, -0.662198543548584, -0.5471101999282837, -0.4320217967033386, -0.31693345308303833, -0.20184510946273804, -0.08675670623779297, 0.028331637382507324, 0.14341998100280762, 0.2585083246231079, 0.3735966980457306, 0.48868507146835327, 0.6037734150886536, 0.7188617587089539, 0.8339501619338989, 0.9490385055541992, 1.0641268491744995, 1.1792151927947998, 1.2943035364151, 1.4093918800354004, 1.5244803428649902, 1.639568567276001, 1.7546570301055908, 1.8697453737258911, 1.9848337173461914, 2.0999221801757812, 2.215010404586792, 2.330098867416382, 2.4451870918273926, 2.5602755546569824, 2.6753640174865723, 2.790452241897583, 2.9055404663085938, 3.0206289291381836, 3.1357171535491943, 3.250805616378784, 3.365893840789795, 3.4809823036193848, 3.5960707664489746, 3.7111589908599854, 3.826247453689575]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 1.0, 11.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.611243963241577, -2.531331777572632, -2.4514195919036865, -2.3715076446533203, -2.291595458984375, -2.2116832733154297, -2.1317710876464844, -2.051858901977539, -1.9719469547271729, -1.8920347690582275, -1.8121227025985718, -1.7322105169296265, -1.6522984504699707, -1.5723862648010254, -1.49247407913208, -1.4125620126724243, -1.332649827003479, -1.2527376413345337, -1.172825574874878, -1.0929133892059326, -1.0130013227462769, -0.9330891370773315, -0.853177011013031, -0.7732648849487305, -0.6933527588844299, -0.6134406328201294, -0.5335285067558289, -0.45361635088920593, -0.3737042248249054, -0.29379209876060486, -0.21387994289398193, -0.1339678168296814, -0.05405569076538086, 0.025856442749500275, 0.10576857626438141, 0.18568071722984314, 0.2655928432941437, 0.3455049693584442, 0.42541712522506714, 0.5053292512893677, 0.5852413773536682, 0.6651535034179688, 0.7450656294822693, 0.8249777555465698, 0.9048899412155151, 0.9848020076751709, 1.0647141933441162, 1.1446263790130615, 1.2245384454727173, 1.3044506311416626, 1.3843626976013184, 1.4642748832702637, 1.5441869497299194, 1.6240991353988647, 1.7040112018585205, 1.7839233875274658, 1.8638355731964111, 1.9437477588653564, 2.0236599445343018, 2.103571891784668, 2.1834840774536133, 2.2633962631225586, 2.343308448791504, 2.423220634460449, 2.5031325817108154]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 17.0, 6.0, 28.0, 35.0, 44.0, 61.0, 96.0, 147.0, 211.0, 439.0, 1019.0, 3458.0, 15066.0, 86356.0, 302223.0, 93687.0, 15754.0, 3320.0, 1056.0, 464.0, 243.0, 163.0, 111.0, 71.0, 56.0, 33.0, 14.0, 20.0, 14.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.245391845703125, -2.18218994140625, -2.118988037109375, -2.0557861328125, -1.992584228515625, -1.92938232421875, -1.866180419921875, -1.802978515625, -1.739776611328125, -1.67657470703125, -1.613372802734375, -1.5501708984375, -1.486968994140625, -1.42376708984375, -1.360565185546875, -1.29736328125, -1.234161376953125, -1.17095947265625, -1.107757568359375, -1.0445556640625, -0.981353759765625, -0.91815185546875, -0.854949951171875, -0.791748046875, -0.728546142578125, -0.66534423828125, -0.602142333984375, -0.5389404296875, -0.475738525390625, -0.41253662109375, -0.349334716796875, -0.2861328125, -0.222930908203125, -0.15972900390625, -0.096527099609375, -0.0333251953125, 0.029876708984375, 0.09307861328125, 0.156280517578125, 0.219482421875, 0.282684326171875, 0.34588623046875, 0.409088134765625, 0.4722900390625, 0.535491943359375, 0.59869384765625, 0.661895751953125, 0.72509765625, 0.788299560546875, 0.85150146484375, 0.914703369140625, 0.9779052734375, 1.041107177734375, 1.10430908203125, 1.167510986328125, 1.230712890625, 1.293914794921875, 1.35711669921875, 1.420318603515625, 1.4835205078125, 1.546722412109375, 1.60992431640625, 1.673126220703125, 1.736328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 6.0, 8.0, 12.0, 18.0, 20.0, 38.0, 34.0, 41.0, 60.0, 62.0, 104.0, 112.0, 98.0, 99.0, 73.0, 51.0, 37.0, 19.0, 24.0, 23.0, 16.0, 10.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.298492431640625, -0.28741455078125, -0.276336669921875, -0.2652587890625, -0.254180908203125, -0.24310302734375, -0.232025146484375, -0.220947265625, -0.209869384765625, -0.19879150390625, -0.187713623046875, -0.1766357421875, -0.165557861328125, -0.15447998046875, -0.143402099609375, -0.13232421875, -0.121246337890625, -0.11016845703125, -0.099090576171875, -0.0880126953125, -0.076934814453125, -0.06585693359375, -0.054779052734375, -0.043701171875, -0.032623291015625, -0.02154541015625, -0.010467529296875, 0.0006103515625, 0.011688232421875, 0.02276611328125, 0.033843994140625, 0.044921875, 0.055999755859375, 0.06707763671875, 0.078155517578125, 0.0892333984375, 0.100311279296875, 0.11138916015625, 0.122467041015625, 0.133544921875, 0.144622802734375, 0.15570068359375, 0.166778564453125, 0.1778564453125, 0.188934326171875, 0.20001220703125, 0.211090087890625, 0.22216796875, 0.233245849609375, 0.24432373046875, 0.255401611328125, 0.2664794921875, 0.277557373046875, 0.28863525390625, 0.299713134765625, 0.310791015625, 0.321868896484375, 0.33294677734375, 0.344024658203125, 0.3551025390625, 0.366180419921875, 0.37725830078125, 0.388336181640625, 0.3994140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 23.0, 37.0, 87.0, 102.0, 107.0, 54.0, 17.0, 18.0, 4.0, 7.0, 2.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6309139728546143, -1.5468950271606445, -1.4628762006759644, -1.3788572549819946, -1.294838309288025, -1.2108194828033447, -1.126800537109375, -1.0427815914154053, -0.9587627053260803, -0.8747438192367554, -0.7907248735427856, -0.7067059874534607, -0.6226871013641357, -0.538668155670166, -0.45464926958084106, -0.37063032388687134, -0.2866114377975464, -0.20259252190589905, -0.1185736209154129, -0.03455471992492676, 0.04946419596672058, 0.13348311185836792, 0.21750199794769287, 0.3015209436416626, 0.38553982973098755, 0.4695587456226349, 0.5535776615142822, 0.6375965476036072, 0.7216154336929321, 0.8056343793869019, 0.8896532654762268, 0.9736722111701965, 1.0576910972595215, 1.1417100429534912, 1.2257288694381714, 1.3097478151321411, 1.3937667608261108, 1.477785587310791, 1.5618045330047607, 1.6458234786987305, 1.7298424243927002, 1.81386137008667, 1.89788019657135, 1.9818991422653198, 2.06591796875, 2.1499369144439697, 2.2339558601379395, 2.317974805831909, 2.401993751525879, 2.4860126972198486, 2.5700316429138184, 2.654050350189209, 2.7380692958831787, 2.8220882415771484, 2.906107187271118, 2.990126132965088, 3.0741448402404785, 3.1581637859344482, 3.242182731628418, 3.3262014389038086, 3.4102203845977783, 3.494239330291748, 3.5782582759857178, 3.6622772216796875, 3.7462961673736572]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 29.0, 44.0, 49.0, 68.0, 67.0, 78.0, 35.0, 15.0, 18.0, 14.0, 3.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.592702627182007, -2.52793288230896, -2.463163375854492, -2.3983936309814453, -2.3336238861083984, -2.2688541412353516, -2.204084634780884, -2.139314889907837, -2.074545383453369, -2.0097756385803223, -1.945006012916565, -1.8802363872528076, -1.8154666423797607, -1.7506970167160034, -1.685927391052246, -1.6211576461791992, -1.5563879013061523, -1.491618275642395, -1.4268485307693481, -1.3620789051055908, -1.297309160232544, -1.2325395345687866, -1.1677699089050293, -1.1030001640319824, -1.038230538368225, -0.973460853099823, -0.9086911678314209, -0.8439215421676636, -0.7791518568992615, -0.7143821716308594, -0.649612545967102, -0.5848428606987, -0.5200729370117188, -0.45530325174331665, -0.39053359627723694, -0.3257639408111572, -0.2609942555427551, -0.19622457027435303, -0.13145491480827332, -0.0666852593421936, -0.001915574073791504, 0.0628540962934494, 0.1276237666606903, 0.1923934370279312, 0.2571631073951721, 0.3219327926635742, 0.38670244812965393, 0.45147210359573364, 0.5162417888641357, 0.5810114741325378, 0.6457811594009399, 0.7105507850646973, 0.7753204703330994, 0.8400901556015015, 0.9048597812652588, 0.9696294665336609, 1.034399151802063, 1.0991687774658203, 1.1639385223388672, 1.2287081480026245, 1.2934777736663818, 1.3582475185394287, 1.423017144203186, 1.4877867698669434, 1.5525565147399902]}, "eval/loss": 4.183660507202148, "eval/wer": 2.4574970249900834, "eval/runtime": 936.4278, "eval/samples_per_second": 2.821, "eval/steps_per_second": 0.236, "train/train_runtime": 5718.4377, "train/train_samples_per_second": 4.991, "train/train_steps_per_second": 0.104, "train/total_flos": 0.0, "train/train_loss": 4.336673439953865} \ No newline at end of file